Repository: OpenCCG/openccg Branch: master Commit: 9968e814a490 Files: 981 Total size: 8.0 MB Directory structure: gitextract_fqyg89tm/ ├── .gitignore ├── AUTHORS ├── CHANGES ├── LICENSE ├── README.md ├── SAMPLE_GRAMMARS ├── TODO ├── bin/ │ ├── ccg-build │ ├── ccg-build.bat │ ├── ccg-cvr │ ├── ccg-cvr.bat │ ├── ccg-draw-graph │ ├── ccg-draw-graph.bat │ ├── ccg-draw-tree │ ├── ccg-draw-tree.bat │ ├── ccg-env │ ├── ccg-env.bat │ ├── ccg-grammardoc │ ├── ccg-grammardoc.bat │ ├── ccg-gt │ ├── ccg-gt.bat │ ├── ccg-ht-factors │ ├── ccg-hypertagger │ ├── ccg-hypertagger.bat │ ├── ccg-parse │ ├── ccg-parse.bat │ ├── ccg-postagger │ ├── ccg-postagger.bat │ ├── ccg-realize │ ├── ccg-realize.bat │ ├── ccg-supertagger │ ├── ccg-supertagger.bat │ ├── ccg-test │ ├── ccg-test.bat │ ├── ccg-update │ ├── ccg-update.bat │ ├── ccg2xml │ ├── ccg2xml.bat │ ├── ccg_draw_tree.py │ ├── dlf_parser.py │ ├── tccg │ ├── tccg.bat │ ├── visccg │ ├── visccg.bat │ └── wccg ├── build.xml ├── ccg-format-grammars/ │ ├── arabic/ │ │ └── arabic.ccg │ ├── inherit/ │ │ └── inherit.ccg │ ├── tiny/ │ │ └── tiny.ccg │ └── tinytiny/ │ └── tinytiny.ccg ├── ccgbank/ │ ├── bin/ │ │ ├── american-to-logical-quotes.py │ │ ├── convert-mtc-systems.py │ │ ├── convert-spaces-to-newlines.py │ │ ├── convert_all │ │ ├── correlate-to-judgments.py │ │ ├── filter_feats.py │ │ ├── find-betas-no-gold.py │ │ ├── gen_parser_events_a │ │ ├── gen_parser_events_b │ │ ├── gen_parser_events_c │ │ ├── gen_parser_events_d │ │ ├── gen_parser_events_e │ │ ├── gen_realizer_events_a │ │ ├── gen_realizer_events_b │ │ ├── gen_realizer_events_c │ │ ├── gen_realizer_events_d │ │ ├── gen_realizer_events_e │ │ ├── get-text-from-mtc-style.py │ │ ├── get-truecase-list.py │ │ ├── get-uniq-nbest.py │ │ ├── get_factors_from_parse.py │ │ ├── get_just_words_from_ner_text.py │ │ ├── lowercase_tagged_text.py │ │ ├── merge-mtc-ids.py │ │ ├── merge-stanford-morpha-with-pos.py │ │ ├── merge_pos_ne.py │ │ ├── my_unicode.py │ │ ├── nbest-mtc-to-bleu-nist.py │ │ ├── ner/ │ │ │ ├── NERApp/ │ │ │ │ └── src/ │ │ │ │ └── nerapp/ │ │ │ │ └── NERApp.java │ │ │ ├── build-ner-api.properties │ │ │ ├── build-ner-api.xml │ │ │ ├── ner-tag.sh │ │ │ ├── ner_word.py │ │ │ └── post-process-stanford-ner.py │ │ ├── normalize_text.py │ │ ├── post-process-metricsmatr.py │ │ ├── prepare-for-stanford-morpha.py │ │ ├── reverse-spaces-to-newlines.py │ │ ├── run-all-bleu.sh │ │ ├── stem_nns_vbx │ │ ├── toUTF-8.py │ │ └── write_morph.py │ ├── build-ht.properties │ ├── build-ht.xml │ ├── build-models.properties │ ├── build-models.xml │ ├── build-original.properties │ ├── build-original.xml │ ├── build-ps.properties │ ├── build-ps.xml │ ├── build-release.xml │ ├── build-rz.properties │ ├── build-rz.xml │ ├── build-st.properties │ ├── build-st.xml │ ├── build.properties │ ├── build.xml │ ├── data/ │ │ ├── README │ │ ├── get_wsj_nns_vb │ │ ├── novel/ │ │ │ └── two-sents │ │ ├── sample/ │ │ │ └── AUTO/ │ │ │ └── 00/ │ │ │ └── wsj_0001.auto │ │ ├── stem_wsj_nns_vb │ │ ├── wsj-nns-vb │ │ ├── wsj-nns-vb-stems │ │ └── wsj_0595Corrected.auto │ ├── extract/ │ │ ├── add-chunks.xsl │ │ ├── convert-to-graph.xsl │ │ ├── convert-to-hlds.xsl │ │ ├── grammar.xml │ │ └── raise-nodes.xsl │ ├── models/ │ │ ├── hypertagger/ │ │ │ ├── ht-prior.flm │ │ │ ├── ht.config │ │ │ ├── ht2.config │ │ │ ├── ht2.train.config │ │ │ ├── pos.config │ │ │ ├── posprior.flm │ │ │ └── vocab.flm │ │ ├── parser/ │ │ │ ├── binary.flm │ │ │ ├── gen-events.prefs │ │ │ ├── leaf.flm │ │ │ ├── model.init │ │ │ ├── parse.prefs │ │ │ ├── top.flm │ │ │ ├── 
unary.flm │ │ │ └── vocab.flm │ │ ├── realizer/ │ │ │ ├── alph.init │ │ │ ├── gen-events.prefs │ │ │ ├── model.init │ │ │ ├── rz-test.prefs │ │ │ └── stp3.flm │ │ └── supertagger/ │ │ ├── pos.config │ │ ├── posprior.flm │ │ ├── st.config │ │ ├── st.config.train │ │ ├── st.noprior.config │ │ ├── stprior.flm │ │ └── vocab.flm │ ├── original/ │ │ └── models/ │ │ ├── postagger/ │ │ │ ├── pos.config │ │ │ └── posprior.flm │ │ └── supertagger/ │ │ ├── st.config │ │ ├── stprior.flm │ │ └── vocab.flm │ ├── plugins/ │ │ ├── MyGenSynScorer.java │ │ ├── MyNgramCombo.java │ │ ├── MyNgramGenSynProduct.java │ │ ├── MyNgramPrecisionBaselineGenInterp.java │ │ ├── MyNgramPrecisionPerceptronInterp.java │ │ ├── MyParserPerceptronScorer.java │ │ ├── MyRealizerPerceptronScorer.java │ │ ├── MySynAgrFeatureExtractor.java │ │ ├── MySynSemAgrFeatureExtractor.java │ │ └── MySynSemFeatureExtractor.java │ ├── stanford-nlp/ │ │ ├── classifiers/ │ │ │ └── stanfordner-README │ │ └── stanfordnlp-README │ └── templates/ │ ├── addFilterLexFeats.xsl │ ├── addStems.xsl │ ├── adjustAppos.xsl │ ├── adjustCandCcats1.xsl │ ├── adjustCats.xsl │ ├── adjustParenthetical.xsl │ ├── adjustReportedSpeech.xsl │ ├── adjustRoles.xsl │ ├── adv-placement.xsl │ ├── agr-macroInsert.xsl │ ├── allotIdLeaf.xsl │ ├── allotIdTree.xsl │ ├── allotIndexRel.xsl │ ├── anim-macroInsert.xsl │ ├── annotateAppos-Dash.xsl │ ├── annotateAppos1.xsl │ ├── annotateAppos2.xsl │ ├── annotateAppos3.xsl │ ├── annotateBrackets.xsl │ ├── annotateColons.xsl │ ├── annotateDots.xsl │ ├── annotateExtraposedAppos.xsl │ ├── annotateNom-AdjConj.xsl │ ├── annotateParentheticals1.xsl │ ├── annotateParentheticals2.xsl │ ├── annotatePlace.xsl │ ├── annotatePrtConjs.xsl │ ├── annotateQuotes.xsl │ ├── annotateReportedSpeech.xsl │ ├── annotateStrayAppos.xsl │ ├── annotateVPCommas.xsl │ ├── balanceAppos.xsl │ ├── balanceDash-Paren.xsl │ ├── catCheck.xsl │ ├── ccgRules.xsl │ ├── changePunct.xsl │ ├── closedCatInsert.xsl │ ├── collapseMWUFull.xsl │ ├── collapseMWUPart.xsl │ ├── collapseMWUSharedTask.xsl │ ├── computeCats.xsl │ ├── convTags.xsl │ ├── correctMistakes1.xsl │ ├── correctPPHeads.xsl │ ├── exportToAuto.xsl │ ├── filterLex.xsl │ ├── find-s-back-n.xsl │ ├── genchal11-out.xsl │ ├── inferConjRules.xsl │ ├── insertLF.xsl │ ├── insertOrigPunctsLF.xsl │ ├── insertPTBInfo.xsl │ ├── insertPunctLF-PosMod.xsl │ ├── insertPunctLF.xsl │ ├── insertQuoteSemClassInfo.xsl │ ├── insertSemFeats.xsl │ ├── introduceMMExtns.xsl │ ├── labelAppos.xsl │ ├── labelConj1.xsl │ ├── labelConj2.xsl │ ├── labelConj3.xsl │ ├── labelPlace1.xsl │ ├── labelPlace2.xsl │ ├── labelPuncts.xsl │ ├── lexExtr.xsl │ ├── macroInsert.xsl │ ├── macroLexDef.xsl │ ├── markMistakes.xsl │ ├── markUnmatched.xsl │ ├── mergeMorph.xsl │ ├── morphExtr.xsl │ ├── normPTBTags.xsl │ ├── normPunctPos.xsl │ ├── origPunctRules.xsl │ ├── overtWHLexRels.xsl │ ├── overtWHPronouns.xsl │ ├── phraseExtractor.xsl │ ├── preSentAdj.xsl │ ├── punctLexConjRules.xsl │ ├── reinsertPTBInfo.xsl │ ├── repairUnmatched.xsl │ ├── replaceColons.xsl │ ├── rulesExtr.xsl │ ├── sentFinalPuncts.xsl │ ├── trueCaser.xsl │ └── uncurryBareParse.xsl ├── devel/ │ ├── BEN.TODO │ └── schedule.txt ├── docs/ │ ├── build.xml │ ├── ccgbank-README │ ├── guide/ │ │ ├── build.xml │ │ ├── cgloss4e.sty │ │ ├── gb4e.sty │ │ ├── guide.tex │ │ ├── openccg.bib │ │ └── openccg.sty │ ├── index.html │ ├── maxent.cpp.patch │ ├── realizer/ │ │ ├── build.xml │ │ ├── cgloss4e.sty │ │ ├── gb4e.sty │ │ ├── manual.tex │ │ ├── openccg.sty │ │ └── refs.bib │ ├── style.css │ └── 
taggers-README ├── grammars/ │ ├── add-chunks.xsl │ ├── add-family-members.xsl │ ├── append.xsl │ ├── categories.xsd │ ├── comic/ │ │ ├── build.xml │ │ ├── dict.xml │ │ ├── dict.xsl │ │ ├── grammar.xml │ │ ├── lexicon-base.xsl │ │ ├── lexicon.xml │ │ ├── morph.xml │ │ ├── rules-base.xml │ │ ├── rules.xml │ │ ├── testbed.xml │ │ ├── types-extras.xml │ │ └── types.xml │ ├── convert-lists.xsl │ ├── convert-to-graph.xsl │ ├── convert-to-hlds.xsl │ ├── core-en/ │ │ ├── add-chunks.xsl │ │ ├── add-intonation-info.xsl │ │ ├── adj.xsl │ │ ├── adv.xsl │ │ ├── auxv.xsl │ │ ├── cats.xsl │ │ ├── conj.xsl │ │ ├── derive-features.xsl │ │ ├── det.xsl │ │ ├── dict.xsl │ │ ├── drop-features.xsl │ │ ├── lexicon.xsl │ │ ├── misc.xsl │ │ ├── np.xsl │ │ ├── pp.xsl │ │ ├── punct.xsl │ │ ├── raise-nodes.xsl │ │ ├── templates.xsl │ │ ├── types.xml │ │ ├── unary-rules.xsl │ │ └── v.xsl │ ├── dict.xsd │ ├── extract-morph.xsl │ ├── flights/ │ │ ├── build.xml │ │ ├── dict.xml │ │ ├── dict.xsl │ │ ├── flairs.xml │ │ ├── grammar.xml │ │ ├── lexicon-base.xsl │ │ ├── lexicon.xml │ │ ├── morph.xml │ │ ├── nina107.xml │ │ ├── rules-base.xml │ │ ├── rules.xml │ │ ├── testbed.xml │ │ ├── types-extras.xml │ │ ├── types.xml │ │ └── vera.xml │ ├── grammar.xsd │ ├── hlds.xsd │ ├── lexicon.xsd │ ├── mini-basque/ │ │ ├── build.xml │ │ ├── dict.xml │ │ ├── grammar.xml │ │ ├── lexicon-base.xml │ │ ├── lexicon.xml │ │ ├── morph.xml │ │ ├── parameters.xml │ │ ├── preset-families.xml │ │ ├── rules.xml │ │ ├── testbed.out │ │ ├── testbed.xml │ │ └── types.xml │ ├── mini-dyirbal/ │ │ ├── build.xml │ │ ├── dict.xml │ │ ├── grammar.xml │ │ ├── lexicon-base.xml │ │ ├── lexicon.xml │ │ ├── morph.xml │ │ ├── parameters.xml │ │ ├── preset-families.xml │ │ ├── rules.xml │ │ ├── testbed.out │ │ ├── testbed.xml │ │ └── types.xml │ ├── mini-english/ │ │ ├── build.xml │ │ ├── dict.xml │ │ ├── grammar.xml │ │ ├── lexicon-base.xml │ │ ├── lexicon.xml │ │ ├── morph.xml │ │ ├── parameters.xml │ │ ├── preset-families.xml │ │ ├── rules.xml │ │ ├── testbed.out │ │ ├── testbed.xml │ │ └── types.xml │ ├── mini-inuit/ │ │ ├── build.xml │ │ ├── dict.xml │ │ ├── grammar.xml │ │ ├── lexicon-base.xml │ │ ├── lexicon.xml │ │ ├── morph.xml │ │ ├── parameters.xml │ │ ├── preset-families.xml │ │ ├── rules.xml │ │ ├── testbed.out │ │ ├── testbed.xml │ │ └── types.xml │ ├── mini-nezperce/ │ │ ├── build.xml │ │ ├── parameters.xml │ │ ├── preset-families.xml │ │ └── types.xml │ ├── mini-tagalog/ │ │ ├── build.xml │ │ ├── dict.xml │ │ ├── grammar.xml │ │ ├── lexicon-base.xml │ │ ├── lexicon.xml │ │ ├── morph.xml │ │ ├── parameters.xml │ │ ├── preset-families.xml │ │ ├── rules.xml │ │ ├── testbed.out │ │ ├── testbed.xml │ │ └── types.xml │ ├── mini-turkish/ │ │ ├── build.xml │ │ ├── dict.xml │ │ ├── grammar.xml │ │ ├── lexicon-base.xml │ │ ├── lexicon.xml │ │ ├── morph.xml │ │ ├── parameters.xml │ │ ├── preset-families.xml │ │ ├── rules.xml │ │ ├── testbed.out │ │ ├── testbed.xml │ │ └── types.xml │ ├── morph.xsd │ ├── parameters.xsd │ ├── parametric-lexicon.xsl │ ├── parametric-types.xsl │ ├── raise-nodes.xsl │ ├── routes/ │ │ ├── build.xml │ │ ├── dict.xml │ │ ├── dlf_test.xml │ │ ├── grammar.xml │ │ ├── lexicon-base.xml │ │ ├── lexicon.xml │ │ ├── morph.xml │ │ ├── rules.xml │ │ ├── testbed.xml │ │ └── types.xml │ ├── rules.xsd │ ├── simplify-lists.xsl │ ├── tiny/ │ │ ├── build.xml │ │ ├── grammar.xml │ │ ├── lexicon.xml │ │ ├── morph.xml │ │ ├── rules.xml │ │ ├── testbed.xml │ │ └── types.xml │ ├── tokens.xsd │ ├── treeify-lists.xsl │ ├── types.xsd │ └── worldcup/ │ 
├── add-chunks.xsl │ ├── build.xml │ ├── dict.xml │ ├── grammar.xml │ ├── lexicon-base.xsl │ ├── lexicon.xml │ ├── morph.xml │ ├── raise-nodes.xsl │ ├── rules.xml │ └── testbed.xml ├── lib/ │ ├── ASL │ ├── LGPL │ ├── LIBNOTES │ ├── MIT │ ├── SUN │ ├── jdom.license │ └── jline.license ├── pom.xml ├── src/ │ ├── ccg2xml/ │ │ ├── README │ │ ├── Tree.py │ │ ├── arabic.ccg │ │ ├── build.xml │ │ ├── ccg.ply │ │ ├── ccg_editor.py │ │ ├── convert-ply.py │ │ ├── grammar_template.ccg │ │ ├── lex.py │ │ └── yacc.py │ ├── kenlm/ │ │ ├── COPYING │ │ ├── COPYING.LESSER │ │ ├── LICENSE │ │ ├── README │ │ ├── build_jnilib.sh │ │ ├── clean_query_only.sh │ │ ├── jni/ │ │ │ └── wrap.cc │ │ ├── lm/ │ │ │ ├── Jamfile │ │ │ ├── bhiksha.cc │ │ │ ├── bhiksha.hh │ │ │ ├── binary_format.cc │ │ │ ├── binary_format.hh │ │ │ ├── blank.hh │ │ │ ├── build_binary_main.cc │ │ │ ├── config.cc │ │ │ ├── config.hh │ │ │ ├── enumerate_vocab.hh │ │ │ ├── facade.hh │ │ │ ├── fragment_main.cc │ │ │ ├── kenlm_max_order_main.cc │ │ │ ├── left.hh │ │ │ ├── left_test.cc │ │ │ ├── lm_exception.cc │ │ │ ├── lm_exception.hh │ │ │ ├── max_order.hh │ │ │ ├── model.cc │ │ │ ├── model.hh │ │ │ ├── model_test.cc │ │ │ ├── model_type.hh │ │ │ ├── ngram_query.hh │ │ │ ├── partial.hh │ │ │ ├── partial_test.cc │ │ │ ├── quantize.cc │ │ │ ├── quantize.hh │ │ │ ├── query_main.cc │ │ │ ├── read_arpa.cc │ │ │ ├── read_arpa.hh │ │ │ ├── return.hh │ │ │ ├── search_hashed.cc │ │ │ ├── search_hashed.hh │ │ │ ├── search_trie.cc │ │ │ ├── search_trie.hh │ │ │ ├── sizes.cc │ │ │ ├── sizes.hh │ │ │ ├── state.hh │ │ │ ├── test.arpa │ │ │ ├── test_nounk.arpa │ │ │ ├── trie.cc │ │ │ ├── trie.hh │ │ │ ├── trie_sort.cc │ │ │ ├── trie_sort.hh │ │ │ ├── value.hh │ │ │ ├── value_build.cc │ │ │ ├── value_build.hh │ │ │ ├── virtual_interface.cc │ │ │ ├── virtual_interface.hh │ │ │ ├── weights.hh │ │ │ └── word_index.hh │ │ └── util/ │ │ ├── Jamfile │ │ ├── bit_packing.cc │ │ ├── bit_packing.hh │ │ ├── bit_packing_test.cc │ │ ├── double-conversion/ │ │ │ ├── Jamfile │ │ │ ├── LICENSE │ │ │ ├── bignum-dtoa.cc │ │ │ ├── bignum-dtoa.h │ │ │ ├── bignum.cc │ │ │ ├── bignum.h │ │ │ ├── cached-powers.cc │ │ │ ├── cached-powers.h │ │ │ ├── diy-fp.cc │ │ │ ├── diy-fp.h │ │ │ ├── double-conversion.cc │ │ │ ├── double-conversion.h │ │ │ ├── fast-dtoa.cc │ │ │ ├── fast-dtoa.h │ │ │ ├── fixed-dtoa.cc │ │ │ ├── fixed-dtoa.h │ │ │ ├── ieee.h │ │ │ ├── strtod.cc │ │ │ ├── strtod.h │ │ │ └── utils.h │ │ ├── ersatz_progress.cc │ │ ├── ersatz_progress.hh │ │ ├── exception.cc │ │ ├── exception.hh │ │ ├── fake_ofstream.hh │ │ ├── file.cc │ │ ├── file.hh │ │ ├── file_piece.cc │ │ ├── file_piece.hh │ │ ├── file_piece_test.cc │ │ ├── getopt.c │ │ ├── getopt.hh │ │ ├── have.hh │ │ ├── joint_sort.hh │ │ ├── joint_sort_test.cc │ │ ├── mmap.cc │ │ ├── mmap.hh │ │ ├── multi_intersection.hh │ │ ├── multi_intersection_test.cc │ │ ├── murmur_hash.cc │ │ ├── murmur_hash.hh │ │ ├── pcqueue.hh │ │ ├── pool.cc │ │ ├── pool.hh │ │ ├── probing_hash_table.hh │ │ ├── probing_hash_table_test.cc │ │ ├── proxy_iterator.hh │ │ ├── read_compressed.cc │ │ ├── read_compressed.hh │ │ ├── read_compressed_test.cc │ │ ├── scoped.cc │ │ ├── scoped.hh │ │ ├── sized_iterator.hh │ │ ├── sorted_uniform.hh │ │ ├── sorted_uniform_test.cc │ │ ├── string_piece.cc │ │ ├── string_piece.hh │ │ ├── string_piece_hash.hh │ │ ├── thread_pool.hh │ │ ├── tokenize_piece.hh │ │ ├── tokenize_piece_test.cc │ │ ├── usage.cc │ │ └── usage.hh │ ├── opennlp/ │ │ ├── ccg/ │ │ │ ├── Parse.java │ │ │ ├── Realize.java │ │ │ ├── TextCCG.java │ │ │ 
├── WebCCG.java │ │ │ ├── alignment/ │ │ │ │ ├── AbstractEncodingScheme.java │ │ │ │ ├── Alignment.java │ │ │ │ ├── Alignments.java │ │ │ │ ├── EncodingScheme.java │ │ │ │ ├── IdentifiedPhraseReader.java │ │ │ │ ├── IdentifiedPhraseWriter.java │ │ │ │ ├── IndexBase.java │ │ │ │ ├── Mapping.java │ │ │ │ ├── MappingFormat.java │ │ │ │ ├── MappingGroup.java │ │ │ │ ├── MappingReader.java │ │ │ │ ├── MappingWriter.java │ │ │ │ ├── MosesEncodingScheme.java │ │ │ │ ├── NAACLEncodingScheme.java │ │ │ │ ├── Phrase.java │ │ │ │ ├── PhrasePosition.java │ │ │ │ ├── PhraseReader.java │ │ │ │ ├── PhraseWriter.java │ │ │ │ ├── Status.java │ │ │ │ └── package.html │ │ │ ├── disjunctivizer/ │ │ │ │ ├── AlignedEdgeFilter.java │ │ │ │ ├── Disjunctivizer.java │ │ │ │ ├── EdgeMatchFilter.java │ │ │ │ ├── FilteredLFEdgeSet.java │ │ │ │ ├── LFGraphDifference.java │ │ │ │ ├── LabelMatchFilter.java │ │ │ │ ├── MatchType.java │ │ │ │ ├── MatchTypeFilter.java │ │ │ │ ├── VertexMatchFilter.java │ │ │ │ └── package.html │ │ │ ├── grammar/ │ │ │ │ ├── AbstractApplicationRule.java │ │ │ │ ├── AbstractCompositionRule.java │ │ │ │ ├── AbstractRule.java │ │ │ │ ├── AbstractSubstitutionRule.java │ │ │ │ ├── AbstractTypeRaisingRule.java │ │ │ │ ├── BackwardApplication.java │ │ │ │ ├── BackwardComposition.java │ │ │ │ ├── BackwardSubstitution.java │ │ │ │ ├── BackwardTypeRaising.java │ │ │ │ ├── ForwardApplication.java │ │ │ │ ├── ForwardComposition.java │ │ │ │ ├── ForwardSubstitution.java │ │ │ │ ├── ForwardTypeRaising.java │ │ │ │ ├── FragmentJoining.java │ │ │ │ ├── GlueRule.java │ │ │ │ ├── Grammar.java │ │ │ │ ├── Rule.java │ │ │ │ ├── RuleGroup.java │ │ │ │ ├── TypeChangingRule.java │ │ │ │ ├── Types.java │ │ │ │ └── to-apml.xsl │ │ │ ├── grammardoc/ │ │ │ │ ├── AbstractDocumenter.java │ │ │ │ ├── Documenter.java │ │ │ │ ├── DocumenterContext.java │ │ │ │ ├── DocumenterException.java │ │ │ │ ├── DocumenterFactory.java │ │ │ │ ├── DocumenterName.java │ │ │ │ ├── DocumenterNotFoundException.java │ │ │ │ ├── DocumenterSourceException.java │ │ │ │ ├── GrammarDoc.java │ │ │ │ ├── GrammarDocException.java │ │ │ │ ├── SourceGrammar.java │ │ │ │ ├── SourceGrammarFile.java │ │ │ │ ├── SourceGrammarFileType.java │ │ │ │ └── html/ │ │ │ │ ├── HTMLDocumenter.java │ │ │ │ ├── base.xsl │ │ │ │ ├── categories.xsl │ │ │ │ ├── comments.xsl │ │ │ │ ├── grammar.xsl │ │ │ │ ├── grammardoc.css │ │ │ │ ├── lexicon.js │ │ │ │ ├── lexicon.xsl │ │ │ │ ├── morph.xsl │ │ │ │ ├── navigation.xsl │ │ │ │ ├── rules.xsl │ │ │ │ └── types.xsl │ │ │ ├── hylo/ │ │ │ │ ├── Alt.java │ │ │ │ ├── Box.java │ │ │ │ ├── Compacter.java │ │ │ │ ├── Converter.java │ │ │ │ ├── Diamond.java │ │ │ │ ├── EPsScorer.java │ │ │ │ ├── EnglishAgreementExtractor.java │ │ │ │ ├── Flattener.java │ │ │ │ ├── HyloAtom.java │ │ │ │ ├── HyloFormula.java │ │ │ │ ├── HyloHelper.java │ │ │ │ ├── HyloVar.java │ │ │ │ ├── LexDepFeatureExtractor.java │ │ │ │ ├── LexDependency.java │ │ │ │ ├── ModalOp.java │ │ │ │ ├── Mode.java │ │ │ │ ├── ModeLabel.java │ │ │ │ ├── ModeVar.java │ │ │ │ ├── Nominal.java │ │ │ │ ├── NominalAtom.java │ │ │ │ ├── NominalVar.java │ │ │ │ ├── Op.java │ │ │ │ ├── Proposition.java │ │ │ │ ├── SatOp.java │ │ │ │ └── graph/ │ │ │ │ ├── DefaultLFEdgeFactory.java │ │ │ │ ├── LFEdge.java │ │ │ │ ├── LFEdgeFactory.java │ │ │ │ ├── LFEdgeLabel.java │ │ │ │ ├── LFGraph.java │ │ │ │ ├── LFGraphFactory.java │ │ │ │ ├── LFVertex.java │ │ │ │ ├── LFVertexType.java │ │ │ │ └── package.html │ │ │ ├── lexicon/ │ │ │ │ ├── DataItem.java │ │ │ │ ├── DefaultTokenizer.java │ │ 
│ │ ├── EnglishExpander.java │ │ │ │ ├── EntriesItem.java │ │ │ │ ├── FactorChainWord.java │ │ │ │ ├── FactorKey.java │ │ │ │ ├── Family.java │ │ │ │ ├── FullWord.java │ │ │ │ ├── LexException.java │ │ │ │ ├── Lexicon.java │ │ │ │ ├── LicensingFeature.java │ │ │ │ ├── ListPairWord.java │ │ │ │ ├── MacroAdder.java │ │ │ │ ├── MacroItem.java │ │ │ │ ├── MorphItem.java │ │ │ │ ├── SimpleWord.java │ │ │ │ ├── SupertaggerAdapter.java │ │ │ │ ├── Tokenizer.java │ │ │ │ ├── TrueCaser.java │ │ │ │ ├── Word.java │ │ │ │ └── WordWithPitchAccent.java │ │ │ ├── ngrams/ │ │ │ │ ├── AAnFilter.java │ │ │ │ ├── AbstractStandardNgramModel.java │ │ │ │ ├── ConditionalProbabilityTable.java │ │ │ │ ├── FactoredNgramModel.java │ │ │ │ ├── FactoredNgramModelFamily.java │ │ │ │ ├── KenNgramModel.java │ │ │ │ ├── LinearNgramScorerCombo.java │ │ │ │ ├── NgramDiversityPruningStrategy.java │ │ │ │ ├── NgramFilter.java │ │ │ │ ├── NgramPrecisionModel.java │ │ │ │ ├── NgramScorer.java │ │ │ │ ├── RepetitionScorer.java │ │ │ │ ├── Reversible.java │ │ │ │ ├── SRILMNgramModel.java │ │ │ │ ├── SRILMNgramModelType.java │ │ │ │ ├── SRILM_FactoredScorerMaker.java │ │ │ │ ├── SRILM_ScorerMaker.java │ │ │ │ ├── SelfParaphraseBiaser.java │ │ │ │ ├── SignScorerInterpolation.java │ │ │ │ ├── SignScorerProduct.java │ │ │ │ ├── StandardNgramModel.java │ │ │ │ └── kenlm/ │ │ │ │ ├── MurmurHash.java │ │ │ │ └── jni/ │ │ │ │ └── KenLM.java │ │ │ ├── parse/ │ │ │ │ ├── Chart.java │ │ │ │ ├── DerivationHistory.java │ │ │ │ ├── Edge.java │ │ │ │ ├── EdgeHash.java │ │ │ │ ├── ParseException.java │ │ │ │ ├── Parser.java │ │ │ │ ├── Supertagger.java │ │ │ │ ├── postagger/ │ │ │ │ │ ├── BasicPOSTagger.java │ │ │ │ │ ├── DummyPOSTagger.java │ │ │ │ │ ├── POSTagSequenceGetter.java │ │ │ │ │ ├── POSTagger.java │ │ │ │ │ └── ml/ │ │ │ │ │ ├── POSPriorModel.java │ │ │ │ │ └── POSTagFex.java │ │ │ │ ├── supertagger/ │ │ │ │ │ ├── JavaSupertaggingApp.java │ │ │ │ │ ├── LabellingStrategy.java │ │ │ │ │ ├── WordAndPOSDictionaryLabellingStrategy.java │ │ │ │ │ ├── io/ │ │ │ │ │ │ ├── XMLPOSDictionaryReader.java │ │ │ │ │ │ └── XMLWordDictionaryReader.java │ │ │ │ │ ├── ml/ │ │ │ │ │ │ ├── FeatureExtractor.java │ │ │ │ │ │ ├── STFex.java │ │ │ │ │ │ ├── STPriorModel.java │ │ │ │ │ │ └── ZhangLeTrainingExtractor.java │ │ │ │ │ └── util/ │ │ │ │ │ ├── PipedTokenizer.java │ │ │ │ │ ├── ProbPairComparator.java │ │ │ │ │ ├── STTaggerDictionary.java │ │ │ │ │ ├── STTaggerPOSDictionary.java │ │ │ │ │ ├── STTaggerWordDictionary.java │ │ │ │ │ ├── SupertagSequenceGetter.java │ │ │ │ │ └── TaggingDictionaryExtractor.java │ │ │ │ └── tagger/ │ │ │ │ ├── Constants.java │ │ │ │ ├── ProbIndexPair.java │ │ │ │ ├── TaggedWord.java │ │ │ │ ├── io/ │ │ │ │ │ ├── CorpusIterator.java │ │ │ │ │ ├── PipeDelimitedFactoredBundleCorpusIterator.java │ │ │ │ │ └── SRILMFactoredBundleCorpusIterator.java │ │ │ │ ├── ml/ │ │ │ │ │ ├── MaxentModel.java │ │ │ │ │ ├── TaggerFeature.java │ │ │ │ │ ├── ZLMEM.java │ │ │ │ │ └── ZLMaxentModel.java │ │ │ │ ├── sequencescoring/ │ │ │ │ │ ├── Backpointer.java │ │ │ │ │ ├── FBNode.java │ │ │ │ │ ├── SequenceScorer.java │ │ │ │ │ └── Trellis.java │ │ │ │ └── util/ │ │ │ │ ├── CCGBankToSRILMFLM.java │ │ │ │ ├── ConfigFileProcessor.java │ │ │ │ └── ResultSink.java │ │ │ ├── perceptron/ │ │ │ │ ├── Alphabet.java │ │ │ │ ├── ComposedFeatureExtractor.java │ │ │ │ ├── ComposedFeatureVector.java │ │ │ │ ├── EventFile.java │ │ │ │ ├── FeatureExtractor.java │ │ │ │ ├── FeatureList.java │ │ │ │ ├── FeatureMap.java │ │ │ │ ├── FeatureVector.java │ │ │ │ 
├── Model.java │ │ │ │ ├── PerceptronScorer.java │ │ │ │ ├── ReRankingPerceptronScorer.java │ │ │ │ └── Trainer.java │ │ │ ├── realize/ │ │ │ │ ├── Chart.java │ │ │ │ ├── DiversityPruningStrategy.java │ │ │ │ ├── Edge.java │ │ │ │ ├── EdgeCombos.java │ │ │ │ ├── EdgeFactory.java │ │ │ │ ├── EdgeHash.java │ │ │ │ ├── FeatureLicenser.java │ │ │ │ ├── Hypertagger.java │ │ │ │ ├── LexicalDiversityPruningStrategy.java │ │ │ │ ├── NBestPruningStrategy.java │ │ │ │ ├── PruningStrategy.java │ │ │ │ ├── Realizer.java │ │ │ │ ├── RuleInstance.java │ │ │ │ ├── StemPruningStrategy.java │ │ │ │ ├── Tracker.java │ │ │ │ └── hypertagger/ │ │ │ │ ├── FeatureExtractionException.java │ │ │ │ ├── LFInfo.java │ │ │ │ ├── LFLoader.java │ │ │ │ ├── LMFactorExtractor.java │ │ │ │ ├── TagExtract.java │ │ │ │ ├── TagExtractor.java │ │ │ │ ├── ZLMaxentHypertagger.java │ │ │ │ ├── ZLMaxentModel.java │ │ │ │ └── ZLPOSTagger.java │ │ │ ├── synsem/ │ │ │ │ ├── AbstractCat.java │ │ │ │ ├── Arg.java │ │ │ │ ├── ArgStack.java │ │ │ │ ├── AtomCat.java │ │ │ │ ├── BasicArg.java │ │ │ │ ├── CatReader.java │ │ │ │ ├── Category.java │ │ │ │ ├── CategoryFcn.java │ │ │ │ ├── CategoryFcnAdapter.java │ │ │ │ ├── ComplexCat.java │ │ │ │ ├── DerivationHandler.java │ │ │ │ ├── Dollar.java │ │ │ │ ├── GenerativeSyntacticModel.java │ │ │ │ ├── LF.java │ │ │ │ ├── LexLogProbFeatureExtractor.java │ │ │ │ ├── LexSemOrigin.java │ │ │ │ ├── Modality.java │ │ │ │ ├── ReRankingScorer.java │ │ │ │ ├── SetArg.java │ │ │ │ ├── Sign.java │ │ │ │ ├── SignHash.java │ │ │ │ ├── SignScorer.java │ │ │ │ ├── Slash.java │ │ │ │ ├── SlashMode.java │ │ │ │ ├── SyntacticFeatureExtractor.java │ │ │ │ ├── TargetCat.java │ │ │ │ └── VarModality.java │ │ │ ├── test/ │ │ │ │ ├── CrossValidateRealizer.java │ │ │ │ ├── DerivMaker.java │ │ │ │ ├── GenTargets.java │ │ │ │ ├── Regression.java │ │ │ │ ├── RegressionInfo.java │ │ │ │ ├── ScorerMaker.java │ │ │ │ ├── TimingMap.java │ │ │ │ ├── UpdateTestbed.java │ │ │ │ └── Validator.java │ │ │ ├── unify/ │ │ │ │ ├── EmptySubstitution.java │ │ │ │ ├── Feature.java │ │ │ │ ├── FeatureStructure.java │ │ │ │ ├── GFeatStruc.java │ │ │ │ ├── GFeatVar.java │ │ │ │ ├── GSubstitution.java │ │ │ │ ├── GUnifier.java │ │ │ │ ├── Indexed.java │ │ │ │ ├── ModFcn.java │ │ │ │ ├── Mutable.java │ │ │ │ ├── SelfCondensingSub.java │ │ │ │ ├── SimpleSubstitution.java │ │ │ │ ├── SimpleType.java │ │ │ │ ├── Substitution.java │ │ │ │ ├── Unifiable.java │ │ │ │ ├── Unifier.java │ │ │ │ ├── UnifyControl.java │ │ │ │ ├── UnifyFailure.java │ │ │ │ └── Variable.java │ │ │ └── util/ │ │ │ ├── ArrayListWithIdentityEquals.java │ │ │ ├── CompositeFilter.java │ │ │ ├── DelegatedFilter.java │ │ │ ├── DisplayPrefs.java │ │ │ ├── Filter.java │ │ │ ├── FilteredMap.java │ │ │ ├── FilteredSet.java │ │ │ ├── GroupMap.java │ │ │ ├── IntHashSetMap.java │ │ │ ├── Interner.java │ │ │ ├── InverseFilter.java │ │ │ ├── JLineReader.java │ │ │ ├── LineReader.java │ │ │ ├── ListMap.java │ │ │ ├── MembershipFilter.java │ │ │ ├── Pair.java │ │ │ ├── SingletonList.java │ │ │ ├── StructureSharingList.java │ │ │ ├── TrieMap.java │ │ │ ├── VisitedFilter.java │ │ │ ├── Visualizer.java │ │ │ └── XmlScanner.java │ │ └── ccgbank/ │ │ ├── CCGBankConvert.java │ │ ├── CCGBankExtract.java │ │ ├── CCGBankTask.java │ │ ├── CCGBankTaskFileGroup.java │ │ ├── CCGBankTaskSources.java │ │ ├── CCGBankTaskTemplates.java │ │ ├── CCGBankTaskTestbed.java │ │ ├── InputSourceAdapter.java │ │ ├── TemplatesProcessor.java │ │ ├── XMLFilterProcessor.java │ │ ├── XSLTProcessor.java │ │ ├── 
ccgbank.properties │ │ ├── convert/ │ │ │ ├── ApposTally.java │ │ │ ├── DiscrCheck.java │ │ │ ├── GenChal11Adjuster.java │ │ │ ├── GenConjRule.java │ │ │ ├── InfoHelper.java │ │ │ ├── Javafns.java │ │ │ ├── MWHelper.java │ │ │ ├── MorphLookup.java │ │ │ ├── OrigPunctRules.java │ │ │ ├── PunctHelper.java │ │ │ ├── RoleAdjuster.java │ │ │ └── XSLTTrueCaser.java │ │ ├── extract/ │ │ │ ├── CatNode.java │ │ │ ├── DebugHelper.java │ │ │ ├── DefaultLFHelper.java │ │ │ ├── ExtractGrammar.java │ │ │ ├── FreqTally.java │ │ │ ├── InsertLFHelper.java │ │ │ ├── LexExtract.java │ │ │ ├── MorphExtrHelper.java │ │ │ ├── MorphExtract.java │ │ │ ├── RulesExtract.java │ │ │ ├── RulesTally.java │ │ │ └── Testbed.java │ │ ├── lexicon-base.xsl │ │ ├── parse/ │ │ │ ├── CCGbankDerivation.jjt │ │ │ ├── SimpleNode.java │ │ │ └── grammarInsert │ │ └── rules-base.xsl │ ├── pom.xml │ └── srilmbridge/ │ ├── Makefile │ └── srilmbridge.cpp └── test/ ├── grammar.xml ├── lexicon.xml ├── morph.xml ├── opennlp/ │ └── ccg/ │ ├── alignment/ │ │ ├── AlignmentTest.java │ │ ├── IdentifiedPhraseReaderWriterTest.java │ │ ├── IndexBaseTest.java │ │ ├── MappingFormatTest.java │ │ ├── MappingGroupTest.java │ │ ├── MappingReaderWriterTest.java │ │ ├── MappingTest.java │ │ ├── PhraseReaderWriterTest.java │ │ └── PhraseTest.java │ ├── disjunctivizer/ │ │ ├── AlignedEdgeFilterTest.java │ │ ├── DisjunctivizerTest.java │ │ ├── EdgeMatchFilterTest.java │ │ ├── FilteredLFEdgeSetTest.java │ │ ├── LFGraphDifferenceTest.java │ │ ├── LabelMatchFilterTest.java │ │ └── VertexMatchFilterTest.java │ ├── hylo/ │ │ └── graph/ │ │ ├── LFBaseTest.java │ │ ├── LFEdgeFactoryTest.java │ │ ├── LFEdgeTest.java │ │ ├── LFGraphTest.java │ │ └── LFVertexTest.java │ └── util/ │ ├── CompositeFilterTest.java │ ├── DelegatedFilterTest.java │ ├── FilteredMapTest.java │ ├── FilteredSetTest.java │ ├── InverseFilterTest.java │ ├── MembershipFilterTest.java │ └── VisitedFilterTest.java ├── output.xml ├── paraphrases.xml ├── rules.xml └── testlf.xml ================================================ FILE CONTENTS ================================================ ================================================ FILE: .gitignore ================================================ *.sw? 
*~ *.jar *.so *.class *.pyc *.tgz *.gz *.lm *.3bo *.mod vocab.* !vocab.flm .project .classpath bin/ccg2xml.py bin/lex.py bin/yacc.py bin/ccg_editor.py bin/Tree.py ccgbank/convert/ ccgbank/data/novel/two-sents.dir/ ccgbank/extract/* !ccgbank/extract/grammar.xml !ccgbank/extract/*.xsl ccgbank/feats/hypertagger/ ccgbank/feats/parser/ ccgbank/feats/realizer/ ccgbank/feats/supertagger/ ccgbank/logs/ ccgbank/models/*/*dict* ccgbank/models/realizer/excl/ ccgbank/original/corpus/ ccgbank/original/feats/postagger/ ccgbank/original/feats/supertagger/ ccgbank/original/logs/ ccgbank/propccgbank/ ccgbank/stanford-nlp/*.jar ccgbank/stanford-nlp/classifiers/*.prop docs/api/ docs/grammars-rough-guide.pdf docs/realizer-manual.pdf docs/guide/guide.* !docs/guide/guide.tex docs/realizer/manual.* !docs/realizer/manual.tex lib/openccg.jar output/ src/ccg2xml/ccg2xml.py src/srilmbridge/*.h ================================================ FILE: AUTHORS ================================================ Main Authors: Core Java Code: Jason Baldridge Gann Bierner Michael White CCG-to-XML: Ben Wing Hypertagger: Dominic Espinosa Supertagger: Dennis Mehay Disjunctivizer: Scott Martin Additional Contributors: Jonathan Barker semantic graph visualization tool Cem Bozsahin grammars from Bozsahin and Steedman (2003) Gunes Erkan handling of type hierarchies Dennis Mehay KenLM interface (in addition to supertagger) Scott Martin GrammarDoc incorporating the SRILM toolkit for scoring build process for CCGbank grammar extraction (in addition to disjunctivizer) Rajakrishnan Rajkumar build files and XSLT transforms for CCGbank grammar extraction English agreement model David Reitter command completion and per grammar history "tiny" grammar Alexandros Triantafyllidis visualization of derivations via latex Ben Wing wccg and WebCCG code; CCG-format grammars (in addition to ccg2xml) ================================================ FILE: CHANGES ================================================ 0.9.6 - ... ----------- * Updated .gitignore, CHANGES and docs/index.html for transition to GitHub 0.9.5 - dependency length minimization, disjunctivizer, KenLM ------------------------------------------------------------- * Added features for dependency ordering and dependency length minimization in realization. * Added disjunctivizer package, for creating a disjunctive LF XML structure based on an LF graph difference. * Added support for using a very large 5-gram memory-mapped language model with KenLM on linux. * Added n-best parser output. * Added option for in-memory perceptron training. 0.9.4 - broad coverage paraphrasing, CCGbank training ----------------------------------------------------- * Added Hockenmaier-style generative probability model for parsing and realization. * Added supertagger and use of adaptive supertagging in parsing. * Added build files for CCGbank training, documented in docs/ccgbank-README, as well as ones for parsing and realizing novel text (thereby generating grammatical paraphrases). * Added release targets for CCGbank data and pre-built English models. * Added use of Stanford tokenizer, morphological analyzer and named entity recognizer in parsing novel text. * Added use of ordinary hashing for lex signs, so that signs that differ only in the pos tag can be distinguished (for robustness). * Added hypertagger input option and derivation history output to ccg-realize. * Added n-best realization output to ccg-test. * Added tracking of lex heads to signs via modifier attr on slashes.
* Added gold standard pred info for training with hypertagger. * Added initial syntactic feature extractor. * Added caching of supertags in cats. * Added option to use word positions in converting atoms in the LFs, which is now the default. Added :nowordpos command in tccg to change the preference to the lexical naming option. * Changed tccg to also update Grammar.theGrammar.prefs, which seems to have fixed issue with :nosem option not working. * Refactored feature extraction to use a trie for representing features as a sequence of interned string keys, to allow for lazy feature extraction that more quickly filters features not in the alphabet. * Added serialization of signs. * Added python script for drawing derivs in .auto files as trees (uses NLTK). * Added cell pruning limit in realization. * Added support for 'magic tokens' (like numbers) in ccg2xml, contributed by vanjena@users.sourceforge.net. * Turned off caching of category hash codes b/c of problems with stale values (a method of checking for staleness might be added later). * Improved utf8 support (esp. for macs). Note that utf8 support seems hopelessly broken for the Windows command-line, in that none of the available terminal apps (including for cygwin) both display characters correctly and work with tccg. I/O to files works fine though. * Added xml escaping for bleu and nbest output. * Added ccg-draw-graph tool for visualizing semantic dependency graphs. 0.9.3 - minor changes ------------------- * Added runCommand method in Visualizer so that the latex visualization works on Linux * Added id info to test items and bleu output. * Changed default lex licensing feature to be last in Lexicon.loadLicensingFeatures. * Added loop for computing closure of licensed no sem edges in EdgeFactory. * Changed FeatureLicenser to unify feat strucs instead of cats. 0.9.2 - VisCCG release plus initial hypertagger support ------------------------------------------------------- * Added check for unary rule cycles in parser and realizer. * Added initial version of greedy fragment assembly in realization when a complete realization is not found. * Added case for composition of X/Y Y/Z where Y has arity 2. * Added option to filter rule apps by observed supercat-rule combos. * VisCCG: Please see the list of changes in the archives at http://comp.ling.utexas.edu/wiki/doku.php/openccg/dev * Added LexSemOrigin interface for tracking of origin of lexical predications back to a sign or unary type changing rule. * Removed unused LF in DataItem. * Added supertagger-based filtering to lexical lookup. * Upgraded to JDOM 1.1. * Upgraded parser to use ambiguity packing. * Added scoring and n-best pruning to parser. * Refactored SignScorer to synsem package, for shared use by the realizer and parser. NB: This may require minor refactoring of imports and recompilation of realizer clients. * Changed realizer to check instantiation of outermost args by default, thereby improving completeness at minor cost to efficiency. Accordingly, renamed checkInstantiation flag in EdgeFactory to debugInstantiation, which now controls whether to report such cats to System.err. * Added hypertagger (realizer supertagger) interface and initial version of beta-best realization using it. * Changed Family.deriveSupertag to remove the semantic part of a cat name following a colon. 0.9.1 - New tools: grammardoc, ccg2xml; other misc updates ---------------------------------------------------------- * Changed dateFormatNoYear to "*.MM.dd" to avoid ambiguity with numbers.
* Changed Grammar.initializeTransformers to set indenting more robustly by adding try-catch blocks for illegal argument exceptions. * Refactored RuleGroup to apply unary and binary rules separately. * Refactored Lexicon and RuleGroup to load lex/morph/rule info incrementally, using a new XmlScanner utility class. These changes avoid the need to store large XML docs all in memory at once, while keeping the refactoring to a minimum. * Revised LF flattening to propagate the alts, opts & chunks based on the expression structure, rather than the graph structure. This change makes the 'shared' attribute (on nominal references) more transparent in how it works with disjunctions that operate on different levels of the tree. * Revised LF compaction to allow duplicate predications, where an attempt is made to attach them in different locations if possible. * Added GrammarDoc, which generates HTML documentation from a source grammar. See README, under `Generating Grammar Documentation' for more information. * Added initial version of ccg2xml, for specifying grammars in the more human-friendly .ccg format. * Changed build system - Made separate build files for ccg2xml and documentation - Made the `release' target of the main build file create a binary for distribution, instead of just the source 0.9.0 - Disjunctive LFs ----------------------- * Refactored realizer to put all no-sem edges on the agenda, which requires making an exception for edges with no indices in the implementation of the index filter, but otherwise yields a more uniform approach to creating edges. * Refactored realizer to use representative edges (one per cat) instead of edge groups, which ends up being simpler on the whole and should be easier to explain. * Refactored categories to allow for equality checks with and without taking the LFs into consideration. * Refactored edge equiv classes to use coverage bit vector and cat sans LF to check equality. * Refactored lex instantiation to produce all possible instantiations that respect the alt exclusivity constraints. * Changed Sign, DerivationHistory to store rule object. * Changed alt edge construction to create new LF from input signs and rule, since signs in equiv class of alts can now have different LFs. * Added active alt tracking and completing of edges with optional bits. * Changed HyloVar to check for equal types when checking for equality up to var renaming. * Refactored generics to avoid type warnings in Eclipse. * Relaxed LF chunking constraints to allow combinations with edges (or trackers more generally) that are shared across multiple alt set options. * Added "shared" attribute to nominal terms to indicate references to nodes that are shared across alternatives in a disjunctive LF; then revamped and reinforced the LF chunking constraints. * Fixed problem with signMap not pointing to opt-completed edge. * Improved edge printing from realizer chart to show derivations. * Updated realizer to keep edges whose signs have the simplest derivation, among those with the same surface words. * Added filter for ungrammatical test cases in ccg-test text output. * Added first draft of realizer manual. 0.8.6 - Java 1.5 switch, n-gram scoring improvements ---------------------------------------------------- * Added propagation of reverse flag on n-gram models. * Refactored LinearNgramScorerCombo and n-gram models to support interpolation at the word level. * Added caching of log probs in NgramScorer, to avoid recomputing log prob of words for a sign's initial sign.
* Added n-gram diversity pruning strategy. * Changed SignHash to only keep signs that are unique up to surface words, thereby ignoring different POS or supertags; also changed it to keep signs with lower derivational complexity during insertion. * Added reverse flag for loaded n-gram models with ccg-test, ccg-realize. * Fixed sentence delimiter text output for reversible standard n-gram models; made AAnFilter reversible. * Added Xalan 2.6.0 jars, to support Java 1.5 builds. * Added support for duration special tokens; note that the implementation has an unavoidable dependency on Java 1.5. 0.8.5 - "Rough Guide", sem types, command history/completion, and more ---------------------------------------------------------------------- * Added initial core-en/types.xml. * Generalized feature licensing to allow for selective listing of supertypes in the also-licensed-by attribute. * Fixed bug in unifying two vars with simple types. * Removed useless SignHash.values method; clarified intention to eventually remove this class. * Streamlined lexical access for realization. * Removed superfluous unique stamps in var classes. * Added support for using simple types (aka sorts) with semantic features and nominals. During category instantiation, a morph item's class is assigned to the nominal var(s) for the [*DEFAULT*] proposition, and the types of all nominal vars are then propagated to all other nominal vars with the same name, throughout the category. * Changed tokenizer keep-words-with-sem-classes option in grammar.xsd to replacement-sem-classes option, where all semantic classes to use in replacing words with sem classes for language models are listed. Also changed semantic class replacement routine to uppercase semantic class names. * Added initial sem types to core-en, comic, and flights grammars. * Fixed bug in constructing type hierarchies with multiple inheritance. * Added ccg-update tool, with initial task to add full words (pre-parsed) to the testbed file; also updated ccg-test to use the pre-parsed words when writing training text files. * Updated ccg-cvr tool to use full words when present. Also added filter to remove test item duplicates from cross-validation training sets. * Added reporting of mean reciprocal rank to ccg-test, as well as residual mean reciprocal rank, based on the cases that do not match the target exactly. * Updated ccg-cvr tool to work with factored language models. * Fixed null pointer exception in DefaultTokenizer.format, Word.setW methods. * Added timing of lex lookup to realization metrics. * Added David's JLine console support to tccg, with command completion and per grammar history. * Added handling of coarticulations in the lexicon. * Added caching of lex lookup during realization. * Updated to-apml.xsl to handle 'and' in multiword elements. * Updated visualizer to handle word lists and to ignore coarts. * Added repetition scorer, for discounting repetitive realizations. * Added scorer class, pruning strategy class options to ccg-realize. * Added workaround for saving command history correctly with Java 1.4 on Linux. * Added 'tiny' grammar. * Added grammars "rough guide". * Added supertag as another word attr. * Revamped LMs to use trie maps, for better speed & scalability. * Improved handling of nulls in FLMs. * Cleaned up word representations. * Added even/odd selection for scoring too in ccg-test. * Added -reverse and -scorer options to ccg-test. * Added reverse LM capability. * Made supertag attrs configurable. * Switched to JDOM 1.0. 
0.8.4 - Factored language models (initial support), packing/unpacking, and more --------------------------------------------------------------- * Added Alex's latex visualization of derivations (nb: launch of previewer works better on Windows than Linux) * Added customizable tokenization and expansion routines for dates/times/nums/amounts and other named entities. * Added -2apml option to ccg-test. * Added Word class and many related changes to tokenization. * Added -textf|-textfsc options to ccg-test, for writing files in the format expected by the SRILM toolkit for factored language models. * Updated copyright notices. * Changed ngram model to use canonical lists of words as keys, removing size restriction. * Added -aanfilter option to ccg-test, with an optional list of exceptions, which may be culled from bigram counts. * Added keep-words-with-sem-classes option to grammar.xsd, to specify exceptional semantic classes where the word form is also considered relevant for scoring models. NB: Also changed grammar.xsd to specify a custom tokenizer class name and/or keep-words-with-sem-classes on a separate tokenizer element. * Added support for factored language models with fixed backoff paths, arranged into families of models for different child variables, and with the option to have secondary models for shorter available histories. Also added corresponding -flm|-flmsc options to ccg-test. * Added option to do scoring in a second stage, starting from a packed representation. * Switch from cached combos to collected combos, making the anytime case more like the packed case. * Added compacting of gen forest when unpacking is turned off. * Added pretty-printing of regex-like gen forest. 0.8.3 - New efficiency methods, Cem-* grammars, and more --------------------------------------------------------------- * Added grammars from Bozsahin and Steedman (2003). * Improved instantiation of unary rules, ensuring that the first pred is used for indexing, and fixing a bug whereby a rule indexed by a lex pred would be missed. * Added initial capability to use semantic classes in n-gram scoring, as shown in ccg-realize. * Added LF chunking rules, which yields the most dramatic improvement in efficiency. * Added systematic feature-based licensing and instantiation. * Added caching of category combinations. * Added labeling of the phrase in the XML output headed by the index associated with the + semantic feature. * Added feature filtering and LF indenting to tccg display options. * Added XML configuration of LF relation sorting. * Added :2tb (to testbed) command for adding the current parse to the testbed. * Fixed grammar loading so it no longer has to be from the current directory. * Made it possible to list a stem as a member of an open class family with a separate pred, without getting an entry with the default pred too. * Enabled indexRel to be declared at the level of entries or families. * Added prefs import/export to tccg. * Added ccg-cvr tool for cross-validating realizer. * Reconfigured ccg-test with various new switches. * Put feature licensing on a switch. * Made pruning strategy configurable. * Changed representation of coord to work better with chunking (though less concise). 
* Added option to stop realizer after new best time limit (past first complete realization) is exceeded, via :nbtl N command 0.8.2 - Edge pruning during realization, XML/APML I/O, and more --------------------------------------------------------------- * Changed build to ccg-build, in bin directory; also added separate build.xml files to each sample grammar directory. This way, a call to ccg-build either builds the system or the current grammar, depending on what directory you're in. * Changed realizer to no longer allow unmatched attr preds (ie sem features). This way, the presence of certain sem features can be used to control realization choices, instead of requiring these features to always be present. To underspecify these choices, the idea is to eventually allow for their optional inclusion. * Added more options to turn settings off individually in tccg. * Enabled realizer to handle type changing rules with their own semantics in the result category. * Added configurable edge pruning per category during realization, which controls the number of edges with equivalent categories to keep in the chart. * Fixed unification bug by adding occurs checks to Dollar's fill method, needed at least in part b/c ArgStack doesn't quite implement Unifiable. * Replaced hashString with hashCode and equals up to var names, yielding a 4-5% improvement in efficiency. * Switched to grammar.xml file. If none exists, an attempt is made to load from the default files lexicon.xml, morph.xml and rules.xml. See grammar.xsd for format. * Added LF load/save from/to XML via a sequence of transformations specified in the grammar.xml file. * Added save-to-xml (:2xml) option for saving LFs to XML files from tccg. * Added save-to-apml (:2apml) option for saving last input string to APML files from tccg. * Updated parser to apply unary rules repeatedly. * Various updates to flights grammar, including use of FrameNet roles. 0.8.1 - OpenCCG Release with XML Schemas (!) ---------------------------------------------------- This release adds XML Schema validation to the grammar build process, where the comments in the XML schemas also serve as reference documentation for the grammar formats (wahoo!). The release also contains several bug fixes to the unification routines, and a more substantial "flights" grammar with semantic control over pitch accents and boundary tones. 0.8.0 - First OpenNLP CCG Library Release ---------------------------------------------------- Reorganized directories and renamed packages and tools. Added build target for worldcup sample grammar. Rewrote scripts for simplicity and parallelism. Cut out pre-processing components and any classes and libraries that looked like dead wood. Started removing unnecessary interfaces. Grok 0.7.0 - Towards a CCG Realizer ---------------------------------------------------- Mike is taking over Grok development and repurposing it for primary use as a CCG Realizer in limited domain dialogue systems. See http://www.iccs.informatics.ed.ac.uk/~mwhite/White-Baldridge-ENLG-2003-to-appear.pdf for a description of the effort so far. Version 0.7.0 will be the last Grok release. After this version, Grok will be split into separately usable and separately developed OpenNLP components. Tom Morton will be responsible for further development of the pre-processing components. Mike will be responsible for further development of the CCG parser and realizer. 
Grok 0.6.0 - Multi-Modal CCG ---------------------------------------------------- For more information, see Jason's dissertation available at: http://www.iccs.inf.ed.ac.uk/~jmb/dissertation See Grok site for further history ... ================================================ FILE: LICENSE ================================================ GNU LESSER GENERAL PUBLIC LICENSE Version 2.1, February 1999 (The master copy of this license lives on the GNU website.) Copyright (C) 1991, 1999 Free Software Foundation, Inc. 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA Everyone is permitted to copy and distribute verbatim copies of this license document, but changing it is not allowed. [This is the first released version of the Lesser GPL. It also counts as the successor of the GNU Library Public License, version 2, hence the version number 2.1.] Preamble The licenses for most software are designed to take away your freedom to share and change it. By contrast, the GNU General Public Licenses are intended to guarantee your freedom to share and change free software--to make sure the software is free for all its users. This license, the Lesser General Public License, applies to some specially designated software packages--typically libraries--of the Free Software Foundation and other authors who decide to use it. You can use it too, but we suggest you first think carefully about whether this license or the ordinary General Public License is the better strategy to use in any particular case, based on the explanations below. When we speak of free software, we are referring to freedom of use, not price. Our General Public Licenses are designed to make sure that you have the freedom to distribute copies of free software (and charge for this service if you wish); that you receive source code or can get it if you want it; that you can change the software and use pieces of it in new free programs; and that you are informed that you can do these things. To protect your rights, we need to make restrictions that forbid distributors to deny you these rights or to ask you to surrender these rights. These restrictions translate to certain responsibilities for you if you distribute copies of the library or if you modify it. For example, if you distribute copies of the library, whether gratis or for a fee, you must give the recipients all the rights that we gave you. You must make sure that they, too, receive or can get the source code. If you link other code with the library, you must provide complete object files to the recipients, so that they can relink them with the library after making changes to the library and recompiling it. And you must show them these terms so they know their rights. We protect your rights with a two-step method: (1) we copyright the library, and (2) we offer you this license, which gives you legal permission to copy, distribute and/or modify the library. To protect each distributor, we want to make it very clear that there is no warranty for the free library. Also, if the library is modified by someone else and passed on, the recipients should know that what they have is not the original version, so that the original author's reputation will not be affected by problems that might be introduced by others. Finally, software patents pose a constant threat to the existence of any free program. We wish to make sure that a company cannot effectively restrict the users of a free program by obtaining a restrictive license from a patent holder.
Therefore, we insist that any patent license obtained for a version of the library must be consistent with the full freedom of use specified in this license. Most GNU software, including some libraries, is covered by the ordinary GNU General Public License. This license, the GNU Lesser General Public License, applies to certain designated libraries, and is quite different from the ordinary General Public License. We use this license for certain libraries in order to permit linking those libraries into non-free programs. When a program is linked with a library, whether statically or using a shared library, the combination of the two is legally speaking a combined work, a derivative of the original library. The ordinary General Public License therefore permits such linking only if the entire combination fits its criteria of freedom. The Lesser General Public License permits more lax criteria for linking other code with the library. We call this license the "Lesser" General Public License because it does Less to protect the user's freedom than the ordinary General Public License. It also provides other free software developers Less of an advantage over competing non-free programs. These disadvantages are the reason we use the ordinary General Public License for many libraries. However, the Lesser license provides advantages in certain special circumstances. For example, on rare occasions, there may be a special need to encourage the widest possible use of a certain library, so that it becomes a de-facto standard. To achieve this, non-free programs must be allowed to use the library. A more frequent case is that a free library does the same job as widely used non-free libraries. In this case, there is little to gain by limiting the free library to free software only, so we use the Lesser General Public License. In other cases, permission to use a particular library in non-free programs enables a greater number of people to use a large body of free software. For example, permission to use the GNU C Library in non-free programs enables many more people to use the whole GNU operating system, as well as its variant, the GNU/Linux operating system. Although the Lesser General Public License is Less protective of the users' freedom, it does ensure that the user of a program that is linked with the Library has the freedom and the wherewithal to run that program using a modified version of the Library. The precise terms and conditions for copying, distribution and modification follow. Pay close attention to the difference between a "work based on the library" and a "work that uses the library". The former contains code derived from the library, whereas the latter must be combined with the library in order to run. TERMS AND CONDITIONS FOR COPYING, DISTRIBUTION AND MODIFICATION 0. This License Agreement applies to any software library or other program which contains a notice placed by the copyright holder or other authorized party saying it may be distributed under the terms of this Lesser General Public License (also called "this License"). Each licensee is addressed as "you". A "library" means a collection of software functions and/or data prepared so as to be conveniently linked with application programs (which use some of those functions and data) to form executables. The "Library", below, refers to any such software library or work which has been distributed under these terms. 
A "work based on the Library" means either the Library or any derivative work under copyright law: that is to say, a work containing the Library or a portion of it, either verbatim or with modifications and/or translated straightforwardly into another language. (Hereinafter, translation is included without limitation in the term "modification".) "Source code" for a work means the preferred form of the work for making modifications to it. For a library, complete source code means all the source code for all modules it contains, plus any associated interface definition files, plus the scripts used to control compilation and installation of the library. Activities other than copying, distribution and modification are not covered by this License; they are outside its scope. The act of running a program using the Library is not restricted, and output from such a program is covered only if its contents constitute a work based on the Library (independent of the use of the Library in a tool for writing it). Whether that is true depends on what the Library does and what the program that uses the Library does. 1. You may copy and distribute verbatim copies of the Library's complete source code as you receive it, in any medium, provided that you conspicuously and appropriately publish on each copy an appropriate copyright notice and disclaimer of warranty; keep intact all the notices that refer to this License and to the absence of any warranty; and distribute a copy of this License along with the Library. You may charge a fee for the physical act of transferring a copy, and you may at your option offer warranty protection in exchange for a fee. 2. You may modify your copy or copies of the Library or any portion of it, thus forming a work based on the Library, and copy and distribute such modifications or work under the terms of Section 1 above, provided that you also meet all of these conditions: a) The modified work must itself be a software library. b) You must cause the files modified to carry prominent notices stating that you changed the files and the date of any change. c) You must cause the whole of the work to be licensed at no charge to all third parties under the terms of this License. d) If a facility in the modified Library refers to a function or a table of data to be supplied by an application program that uses the facility, other than as an argument passed when the facility is invoked, then you must make a good faith effort to ensure that, in the event an application does not supply such function or table, the facility still operates, and performs whatever part of its purpose remains meaningful. (For example, a function in a library to compute square roots has a purpose that is entirely well-defined independent of the application. Therefore, Subsection 2d requires that any application-supplied function or table used by this function must be optional: if the application does not supply it, the square root function must still compute square roots.) These requirements apply to the modified work as a whole. If identifiable sections of that work are not derived from the Library, and can be reasonably considered independent and separate works in themselves, then this License, and its terms, do not apply to those sections when you distribute them as separate works. 
But when you distribute the same sections as part of a whole which is a work based on the Library, the distribution of the whole must be on the terms of this License, whose permissions for other licensees extend to the entire whole, and thus to each and every part regardless of who wrote it. Thus, it is not the intent of this section to claim rights or contest your rights to work written entirely by you; rather, the intent is to exercise the right to control the distribution of derivative or collective works based on the Library. In addition, mere aggregation of another work not based on the Library with the Library (or with a work based on the Library) on a volume of a storage or distribution medium does not bring the other work under the scope of this License. 3. You may opt to apply the terms of the ordinary GNU General Public License instead of this License to a given copy of the Library. To do this, you must alter all the notices that refer to this License, so that they refer to the ordinary GNU General Public License, version 2, instead of to this License. (If a newer version than version 2 of the ordinary GNU General Public License has appeared, then you can specify that version instead if you wish.) Do not make any other change in these notices. Once this change is made in a given copy, it is irreversible for that copy, so the ordinary GNU General Public License applies to all subsequent copies and derivative works made from that copy. This option is useful when you wish to copy part of the code of the Library into a program that is not a library. 4. You may copy and distribute the Library (or a portion or derivative of it, under Section 2) in object code or executable form under the terms of Sections 1 and 2 above provided that you accompany it with the complete corresponding machine-readable source code, which must be distributed under the terms of Sections 1 and 2 above on a medium customarily used for software interchange. If distribution of object code is made by offering access to copy from a designated place, then offering equivalent access to copy the source code from the same place satisfies the requirement to distribute the source code, even though third parties are not compelled to copy the source along with the object code. 5. A program that contains no derivative of any portion of the Library, but is designed to work with the Library by being compiled or linked with it, is called a "work that uses the Library". Such a work, in isolation, is not a derivative work of the Library, and therefore falls outside the scope of this License. However, linking a "work that uses the Library" with the Library creates an executable that is a derivative of the Library (because it contains portions of the Library), rather than a "work that uses the library". The executable is therefore covered by this License. Section 6 states terms for distribution of such executables. When a "work that uses the Library" uses material from a header file that is part of the Library, the object code for the work may be a derivative work of the Library even though the source code is not. Whether this is true is especially significant if the work can be linked without the Library, or if the work is itself a library. The threshold for this to be true is not precisely defined by law. 
If such an object file uses only numerical parameters, data structure layouts and accessors, and small macros and small inline functions (ten lines or less in length), then the use of the object file is unrestricted, regardless of whether it is legally a derivative work. (Executables containing this object code plus portions of the Library will still fall under Section 6.) Otherwise, if the work is a derivative of the Library, you may distribute the object code for the work under the terms of Section 6. Any executables containing that work also fall under Section 6, whether or not they are linked directly with the Library itself. 6. As an exception to the Sections above, you may also combine or link a "work that uses the Library" with the Library to produce a work containing portions of the Library, and distribute that work under terms of your choice, provided that the terms permit modification of the work for the customer's own use and reverse engineering for debugging such modifications. You must give prominent notice with each copy of the work that the Library is used in it and that the Library and its use are covered by this License. You must supply a copy of this License. If the work during execution displays copyright notices, you must include the copyright notice for the Library among them, as well as a reference directing the user to the copy of this License. Also, you must do one of these things: a) Accompany the work with the complete corresponding machine-readable source code for the Library including whatever changes were used in the work (which must be distributed under Sections 1 and 2 above); and, if the work is an executable linked with the Library, with the complete machine-readable "work that uses the Library", as object code and/or source code, so that the user can modify the Library and then relink to produce a modified executable containing the modified Library. (It is understood that the user who changes the contents of definitions files in the Library will not necessarily be able to recompile the application to use the modified definitions.) b) Use a suitable shared library mechanism for linking with the Library. A suitable mechanism is one that (1) uses at run time a copy of the library already present on the user's computer system, rather than copying library functions into the executable, and (2) will operate properly with a modified version of the library, if the user installs one, as long as the modified version is interface-compatible with the version that the work was made with. c) Accompany the work with a written offer, valid for at least three years, to give the same user the materials specified in Subsection 6a, above, for a charge no more than the cost of performing this distribution. d) If distribution of the work is made by offering access to copy from a designated place, offer equivalent access to copy the above specified materials from the same place. e) Verify that the user has already received a copy of these materials or that you have already sent this user a copy. For an executable, the required form of the "work that uses the Library" must include any data and utility programs needed for reproducing the executable from it. However, as a special exception, the materials to be distributed need not include anything that is normally distributed (in either source or binary form) with the major components (compiler, kernel, and so on) of the operating system on which the executable runs, unless that component itself accompanies the executable. 
It may happen that this requirement contradicts the license restrictions of other proprietary libraries that do not normally accompany the operating system. Such a contradiction means you cannot use both them and the Library together in an executable that you distribute. 7. You may place library facilities that are a work based on the Library side-by-side in a single library together with other library facilities not covered by this License, and distribute such a combined library, provided that the separate distribution of the work based on the Library and of the other library facilities is otherwise permitted, and provided that you do these two things: a) Accompany the combined library with a copy of the same work based on the Library, uncombined with any other library facilities. This must be distributed under the terms of the Sections above. b) Give prominent notice with the combined library of the fact that part of it is a work based on the Library, and explaining where to find the accompanying uncombined form of the same work. 8. You may not copy, modify, sublicense, link with, or distribute the Library except as expressly provided under this License. Any attempt otherwise to copy, modify, sublicense, link with, or distribute the Library is void, and will automatically terminate your rights under this License. However, parties who have received copies, or rights, from you under this License will not have their licenses terminated so long as such parties remain in full compliance. 9. You are not required to accept this License, since you have not signed it. However, nothing else grants you permission to modify or distribute the Library or its derivative works. These actions are prohibited by law if you do not accept this License. Therefore, by modifying or distributing the Library (or any work based on the Library), you indicate your acceptance of this License to do so, and all its terms and conditions for copying, distributing or modifying the Library or works based on it. 10. Each time you redistribute the Library (or any work based on the Library), the recipient automatically receives a license from the original licensor to copy, distribute, link with or modify the Library subject to these terms and conditions. You may not impose any further restrictions on the recipients' exercise of the rights granted herein. You are not responsible for enforcing compliance by third parties with this License. 11. If, as a consequence of a court judgment or allegation of patent infringement or for any other reason (not limited to patent issues), conditions are imposed on you (whether by court order, agreement or otherwise) that contradict the conditions of this License, they do not excuse you from the conditions of this License. If you cannot distribute so as to satisfy simultaneously your obligations under this License and any other pertinent obligations, then as a consequence you may not distribute the Library at all. For example, if a patent license would not permit royalty-free redistribution of the Library by all those who receive copies directly or indirectly through you, then the only way you could satisfy both it and this License would be to refrain entirely from distribution of the Library. If any portion of this section is held invalid or unenforceable under any particular circumstance, the balance of the section is intended to apply, and the section as a whole is intended to apply in other circumstances. 
It is not the purpose of this section to induce you to infringe any patents or other property right claims or to contest validity of any such claims; this section has the sole purpose of protecting the integrity of the free software distribution system which is implemented by public license practices. Many people have made generous contributions to the wide range of software distributed through that system in reliance on consistent application of that system; it is up to the author/donor to decide if he or she is willing to distribute software through any other system and a licensee cannot impose that choice. This section is intended to make thoroughly clear what is believed to be a consequence of the rest of this License. 12. If the distribution and/or use of the Library is restricted in certain countries either by patents or by copyrighted interfaces, the original copyright holder who places the Library under this License may add an explicit geographical distribution limitation excluding those countries, so that distribution is permitted only in or among countries not thus excluded. In such case, this License incorporates the limitation as if written in the body of this License. 13. The Free Software Foundation may publish revised and/or new versions of the Lesser General Public License from time to time. Such new versions will be similar in spirit to the present version, but may differ in detail to address new problems or concerns. Each version is given a distinguishing version number. If the Library specifies a version number of this License which applies to it and "any later version", you have the option of following the terms and conditions either of that version or of any later version published by the Free Software Foundation. If the Library does not specify a license version number, you may choose any version ever published by the Free Software Foundation. 14. If you wish to incorporate parts of the Library into other free programs whose distribution conditions are incompatible with these, write to the author to ask for permission. For software which is copyrighted by the Free Software Foundation, write to the Free Software Foundation; we sometimes make exceptions for this. Our decision will be guided by the two goals of preserving the free status of all derivatives of our free software and of promoting the sharing and reuse of software generally. NO WARRANTY 15. BECAUSE THE LIBRARY IS LICENSED FREE OF CHARGE, THERE IS NO WARRANTY FOR THE LIBRARY, TO THE EXTENT PERMITTED BY APPLICABLE LAW. EXCEPT WHEN OTHERWISE STATED IN WRITING THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES PROVIDE THE LIBRARY "AS IS" WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE. THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE OF THE LIBRARY IS WITH YOU. SHOULD THE LIBRARY PROVE DEFECTIVE, YOU ASSUME THE COST OF ALL NECESSARY SERVICING, REPAIR OR CORRECTION. 16. 
IN NO EVENT UNLESS REQUIRED BY APPLICABLE LAW OR AGREED TO IN WRITING WILL ANY COPYRIGHT HOLDER, OR ANY OTHER PARTY WHO MAY MODIFY AND/OR REDISTRIBUTE THE LIBRARY AS PERMITTED ABOVE, BE LIABLE TO YOU FOR DAMAGES, INCLUDING ANY GENERAL, SPECIAL, INCIDENTAL OR CONSEQUENTIAL DAMAGES ARISING OUT OF THE USE OR INABILITY TO USE THE LIBRARY (INCLUDING BUT NOT LIMITED TO LOSS OF DATA OR DATA BEING RENDERED INACCURATE OR LOSSES SUSTAINED BY YOU OR THIRD PARTIES OR A FAILURE OF THE LIBRARY TO OPERATE WITH ANY OTHER SOFTWARE), EVEN IF SUCH HOLDER OR OTHER PARTY HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH DAMAGES. END OF TERMS AND CONDITIONS ================================================ FILE: README.md ================================================ # OpenCCG OpenCCG is a system for parsing and generating text using [combinatory categorial grammar](https://en.wikipedia.org/wiki/Combinatory_categorial_grammar) for syntax and [hybrid logic dependency semantics](https://www.aclweb.org/anthology/P02-1041) for, well, the semantic representation. If that seems like a mouthful, don't worry too much about the details right now. You can get started [installing OpenCCG](https://davehowcroft.com/post/installing-openccg/) and [working with OpenCCG using the `tccg` utility](https://davehowcroft.com/post/getting-started-with-openccg/) right now. If, on the other hand, you want to start understanding what that mouthful means, Johanna Moore at the University of Edinburgh has some [helpful course notes on NLG in general and OpenCCG in particular](https://www.inf.ed.ac.uk/teaching/courses/nlg/). # Project information See CHANGES for a description of the project status. Also see the OpenCCG web site and wiki at UT Austin: * http://openccg.sf.net * http://www.utcompling.com/wiki/openccg This `README.md` file contains the configuration and build instructions. Next you'll probably want to look at the tutorial on writing grammars in the human-friendly 'dot ccg' syntax on [the UT Austin OpenCCG wiki](http://www.utcompling.com/wiki/openccg/visccg-tutorial). After that it may be helpful to look at the "native" grammar specification in "Specifying Grammars for OpenCCG: A Rough Guide" in `docs/grammars-rough-guide.pdf`, as well as the `SAMPLE_GRAMMARS` file for descriptions of the sample grammars that come with the distribution, including ones using the DotCCG syntax. A (somewhat dated) programmer's guide to using the OpenCCG realizer appears in `docs/realizer-manual.pdf`. This release also includes a broad English coverage grammar from the CCGBank and associated statistical models; see `docs/ccgbank-README` for details. # Requirements * Version 1.6 or later of the Java 2 SDK (http://java.sun.com) * For ccg2xml and other tools, Python version 2.4 to 2.7 (http://www.python.org) # Libraries If you're working with the latest source version from GitHub, you'll need to download the external libraries from the latest release, as GitHub discourages including binaries in their repos: * Download the [latest release of OpenCCG from sourceforge](https://sourceforge.net/projects/openccg/) * Unpack the archive and copy over the files from `openccg/lib/`, as well as `openccg/ccgbank/bin/ner/NERApp.jar` * Build the latest source as described further below # Configuring your environment variables The easiest thing to do is to set the environment variables `JAVA_HOME` and `OPENCCG_HOME` to the relevant locations on your system. Set `JAVA_HOME` to match the top level directory containing the Java installation you want to use. 
For example, on Windows: ``` C:\> set JAVA_HOME=C:\Program Files\jdk1.6.0_04 ``` or on Unix: ``` % setenv JAVA_HOME /usr/local/java (csh) > export JAVA_HOME=/usr/java (ksh, bash) ``` On Windows, to get these settings to persist, it's actually easiest to set your environment variables through the System Properties from the Control Panel. For example, under WinXP, go to Control Panel, click on System Properties, choose the Advanced tab, click on Environment Variables, and add your settings in the User variables area. Next, likewise set `OPENCCG_HOME` to be the top level directory where you unzipped the download. In Unix, type `pwd` in the directory where this file is and use the path given to you by the shell as `OPENCCG_HOME`. You can set this in the same manner as for `JAVA_HOME` above. Next, add the directory `OPENCCG_HOME/bin` to your path. For example, you can set the path in your `.bashrc` file as follows: ``` > export PATH="$PATH:$OPENCCG_HOME/bin" ``` On Windows, you should also add the python main directory to your path. Finally, if you are going to use [KenLM](https://kheafield.com/code/kenlm/) with very large language models for realization with CCGbank-extracted grammars on linux, you'll also need to set the library load path: ``` > export LD_LIBRARY_PATH=$LD_LIBRARY_PATH:$OPENCCG_HOME/lib ``` Once you have taken care of these things, you should be able to build and use the OpenCCG Library. **Note**: Spaces are allowed in `JAVA_HOME` but not in `OPENCCG_HOME`. To set an environment variable with spaces in it, you need to put quotes around the value when on Unix, but you must *NOT* do this when under Windows. # Increasing Java memory limit If you're working with a broad coverage grammar and statistical parsing or realization models, you'll probably need to increase the default memory limit for running OpenCCG's tools. You can do so by editing `bin/ccg-env[.bat]`, increasing the JAVA_MEM environment variable at the end of this script. For training perceptron models in memory, you may need 16g; for realization with the very large gigaword 5-gram model, you may need 8g; otherwise, for parsing and realization with CCGbank-derived models, 4g or possibly even 2g should suffice; finally, for small grammars 512m or 256m should be ok. # Trying it out If you've managed to configure the system, you should be able to change to the directory for the "tiny" sample grammar and run `tccg` (for text ccg), the command-line tool for interactively testing grammars: ``` > cd grammars > cd tiny > tccg (Windows/Unix) ``` Provided tccg starts properly, it loads the grammar files, parses them, and shows the command-line interface (at which point you can type `:h` for help or `:q` to quit). If you have trouble starting up tccg, make sure you have set the environment variables properly, and that the tccg script (located in `openccg/bin`) calls the right shell environment (the top line of the script; to solve the problem, either comment out this line or correct the path). # Visualizing semantic graphs Semantic dependency graphs in testbed files can be visualized with the help of Graphviz's dot tool. First, download and install [Graphviz](http://www.graphviz.org/). Then, use tccg to create a testbed file with logical forms in it. For example, you can try some examples in the worldcup sample grammar and save them to a file using the command ':2tb tb.xml'. Then make a directory to store the visualized graphs.
Finally, run the ccg-draw-graph tool as shown below: ``` > cd grammars/worldcup > tccg (parse examples, save using ':2tb tb.xml') > mkdir graphs > ccg-draw-graph -i tb.xml -v graphs/g ``` You can also show the semantic classes or word indices using the `-c` or `-w` options, respectively. The graphs can be displayed with any PDF display tool. Note that the graph visualization requires the logical forms to be stored in an xml node-rel format for graphs, as in the worldcup or routes sample grammars. See `SAMPLE_GRAMMARS` for more information. # Creating disjunctive logical forms This release includes a new disjunctivizer package, for creating a disjunctive LF XML structure based on an LF graph difference. An LF graph difference is a characterization of the difference between two Hybrid Logic Dependency Semantics graphs and an alignment between them in terms of the edits needed to make one into the other: inserts, deletes, and substitutions. See the build file for junit tests that illustrate how to use the package. # Generating grammar documentation OpenCCG includes a tool for generating HTML documentation of the XML files that specify a grammar. It can be run either from the `ccg-grammardoc` script in the `bin/` directory, or as an Ant task. An example of how to incorporate GrammarDoc into an Ant build file is given in the "tiny" grammar (`grammars/tiny/build.xml`), in a build target called `document`. # Building the system from source The OpenCCG build system is based on Apache Ant. Ant is a little but very handy tool that uses a build file written in XML (`build.xml`) as building instructions. Building the Java portion of OpenCCG is accomplished using the script `ccg-build`; this works under Windows and Unix, but requires that you run it from the top-level directory (where the `build.xml` file is located). If everything is right and all the required packages are visible, this action will generate a file called openccg.jar in the `./lib` directory. Note that you should *not* build from source by invoking 'ant' directly. Instead, you should use `ccg-build` as shown below (Unix), after ensuring that you've set `OPENCCG_HOME`, `JAVA_HOME` and updated your `PATH` (the `ccg-build` script invokes ant with various parameters that aren't set properly if ant is invoked from the command line): ``` > cd $OPENCCG_HOME > ccg-build ``` # Working with the Eclipse IDE The Eclipse IDE can be used for editing the Java source code, though setup can be a bit tricky. The most reliable method seems to be as follows. First, follow the instructions above for building the source from the command line. Then, in Eclipse, choose File|New|Java Project to create a new Java Project, and give it a name, such as 'openccg'. Leave the default settings as they are, and click Next. Then choose Link Additional Source and browse to the folder `src/` in the directory where you installed OpenCCG (i.e. `$OPENCCG_HOME/src`). You'll need to give this location a new name, such as 'src2' ('src' is already taken by default). The final step is to Add External JARs under the Libraries tab. From OpenCCG's lib directory (i.e. `$OPENCCG_HOME/lib`), choose all of the `.jar` files. At this point, you should be able to hit Finish and the code should compile in Eclipse. Note that with Eclipse's default settings, the code will compile in your Eclipse workspace, which is separate from your OpenCCG installation (this is a good thing, as Eclipse uses a `bin/` directory for compiled Java classes, whereas OpenCCG uses `bin/` for command-line scripts). 
Thus, once you have made a round of changes in Eclipse and are ready to try them out in OpenCCG, go back to the command line in `$OPENCCG_HOME` and invoke `ccg-build` to re-build the `openccg.jar` file. This will make your changes available in OpenCCG's programs, such as `tccg`. # Bug Reports Please report bugs by creating [an issue with a description of the problem](https://github.com/OpenCCG/openccg/issues). ================================================ FILE: SAMPLE_GRAMMARS ================================================ This SAMPLE_GRAMMARS file describes the sample grammars that come with the distribution, and provides an overview of how the grammars are organized. Grammars written directly in the XML format used by OpenCCG appear in separate directories under grammars/. There are currently four small English grammars -- tiny, worldcup, flights, and comic -- plus a series of related grammars, mini-*, for Basque, Dyirbal, English, Inuit, Tagalog and Turkish, which are from Bozsahin and Steedman's (2003) study of ergativity. The worldcup grammar includes the English examples from Baldridge (2002). (The Dutch, Turkish, Tagalog, and Toba Batak grammars have not been updated from Grok version 0.6.) The flights and comic grammars (used in the FLIGHTS and COMIC systems) make use of a shared grammar of core English, in the core-en dir, and contain categories for pitch accents and boundary tones. Grammars written in the front-end `dot CCG' format, which attempts to provide a more powerful and easier-to-use format than the raw XML, are in separate directories under ccg-format-grammars/. There are currently three grammars here -- tiny, tinytiny, and arabic. `tiny' is a grammar originally based on the `tiny' English grammar contained in the grammars/ directory and documented above. It has been significantly expanded so as to demonstrate the various features of the CCG format. `tinytiny' is a smaller English grammar extracted from `tiny', which attempts to demonstrate a minimal-size useful grammar. `arabic' is a grammar of a large chunk of Classical Arabic, written by Ben Wing. It was created in particular to demonstrate the power of CCG-format macros in handling complex morphology, and contains a nearly full grammar of Arabic verbs. Dot CCG grammars are compiled using ccg2xml; run ccg2xml -h for usage. The best place to look for more info on the dot CCG format is in ccg-format-grammars/tiny/tiny.ccg and in src/ccg2xml/README. This release also includes a broad English coverage grammar from the CCGBank and associated statistical models; see docs/ccgbank-README for details. Note that with all the grammars, there is the option to store logical forms in an xml node-rel format for graphs. Conversion to this graph format is done using a couple of XSLT transforms specified in the grammar.xml file; see grammars/worldcup/grammar.xml for an example. When using this graph format, it is also possible to visualize the semantic graphs, as described in the main README file. At present, ccg2xml does not support writing grammar.xml files with the XSLT transforms for the node-rel graph format. As a workaround, you can add these transforms to your own version of the file which you then copy over the generated grammar.xml file, as shown below.
> ccg2xml --prefix= mygram.ccg > cp mygram-grammar.xml grammar.xml ================================================ FILE: TODO ================================================ General OpenCCG development: ---------------------------- - Add check for target LF when adding/writing full words (incl. supertags). - Look into better handling of optional args. - Extend feature hierarchy biz to work with category types; would make sense to also add category vars. - Add final bits to grammars rough guide (esp. feature licensing). - Add option to update testbed. - Binding theory? - Get agreement to work with anaphors in appositives. - Add more dynamic checks, eg for non-existent indexRel values or licensing attrs. - Add well-formedness check for unique roles -- ie, that role must occur only once per semantic head -- and associated method for declaring that roles must be unique. - Interface to morph transducers. - Make UnifyControl etc thread friendly. Could try tying global vars to current thread. - Improve unification efficiency. Could try indexing, caching across calls to parser or realizer, and structure sharing with delayed copying. Realizer-oriented development: ------------------------------ - Try using coarticulations with pitch accents. - Add orthographic post-processing (capitalization, spacing of punctuation). - Look into instantiating outermost args. TODO prior to Feb 16: --------------------- Tabs for testbed, lexicon, features Nice tree graph for features Get Arabic to compile Issues of colors, fonts, etc. (Alexis help) PNG's of the slash modalities Option menu for different magnification (50%, 100%, 200% ...) Get pretty buttons from Justin Make sure all path, etc. issues are working Figure out what's the deal with __init__.py -- importing from another dir Possibly: help-over descriptions of families, provided by Javadoc-style comments in the source Alexis -- help with more specific user-interface issues, overall management involving various people Sudipta -- -- PNG's of slash modalities; add to editor -- TeX/Tk font conversion -- find a Tkinter package for displaying tree graphs; use it to add a graph for features to the editor -- figure out what's wrong with arabic? semantics: RED features: BLUE categories: BLACK, sans serif font background: WHITE Ben TODO!!!!! ------------- Create professional-looking web page off of comp.ling.utexas.edu ================================================ FILE: bin/ccg-build ================================================ #!/bin/sh . ccg-env ANT_HOME="$OPENCCG_LIB" PROPS="-Dant.home=$ANT_HOME -Dopenccg.home=$OPENCCG_HOME" case `uname` in CYGWIN* ) XALAN_JARS="$OPENCCG_LIB/xalan.jar;$OPENCCG_LIB/xercesImpl.jar;$OPENCCG_LIB/xml-apis.jar;$OPENCCG_LIB/xsltc.jar;$OPENCCG_LIB/serializer.jar" ANT_JARS="$OPENCCG_LIB/ant.jar;$OPENCCG_LIB/ant-launcher.jar;$OPENCCG_LIB/ant-contrib.jar" ANT_JARS="$ANT_JARS;$OPENCCG_LIB/ant-junit.jar;$OPENCCG_LIB/ant-junit4.jar;$OPENCCG_LIB/junit-4.10.jar" CP="$JAVA_HOME/lib/tools.jar;$OPENCCG_JAR;$ANT_JARS;$XALAN_JARS;$DIRLIBS;." PROPS="$PROPS -Dcygwin=true" ;; * ) XALAN_JARS="$OPENCCG_LIB/xalan.jar:$OPENCCG_LIB/xercesImpl.jar:$OPENCCG_LIB/xml-apis.jar:$OPENCCG_LIB/xsltc.jar:$OPENCCG_LIB/serializer.jar" ANT_JARS="$OPENCCG_LIB/ant.jar:$OPENCCG_LIB/ant-launcher.jar:$OPENCCG_LIB/ant-contrib.jar" ANT_JARS="$ANT_JARS:$OPENCCG_LIB/ant-junit.jar:$OPENCCG_LIB/ant-junit4.jar:$OPENCCG_LIB/junit-4.10.jar" CP="$JAVA_HOME/lib/tools.jar:$OPENCCG_JAR:$ANT_JARS:$XALAN_JARS:$DIRLIBS:." 
;; esac "$JAVA" $JAVA_MEM -classpath "$CP" $PROPS org.apache.tools.ant.launch.Launcher $@ ================================================ FILE: bin/ccg-build.bat ================================================ @echo off call ccg-env set ANT_HOME=%OPENCCG_LIB% set PROPS=-Dant.home=%ANT_HOME% -Dopenccg.home=%OPENCCG_HOME% set XALAN_JARS=%OPENCCG_LIB%\xalan.jar;%OPENCCG_LIB%\xercesImpl.jar;%OPENCCG_LIB%\xml-apis.jar;%OPENCCG_LIB%\xsltc.jar;%OPENCCG_LIB%\serializer.jar set ANT_JARS=%OPENCCG_LIB%\ant.jar;%OPENCCG_LIB%\ant-launcher.jar;%OPENCCG_LIB%\ant-contrib.jar set ANT_JARS=%ANT_JARS%;%OPENCCG_LIB%\ant-junit.jar;%OPENCCG_LIB%\ant-junit4.jar;%OPENCCG_LIB%\junit-4.10.jar set CP="%JAVA_HOME%\lib\tools.jar";%OPENCCG_JAR%;%ANT_JARS%;%XALAN_JARS%;%DIRLIBS%;. %JAVA% %JAVA_MEM% -classpath %CP% %PROPS% org.apache.tools.ant.launch.Launcher %* ================================================ FILE: bin/ccg-cvr ================================================ #!/bin/sh # For usage, do: ccg-cvr -h . ccg-env "$JAVA" $JAVA_ARGS opennlp.ccg.test.CrossValidateRealizer $@ ================================================ FILE: bin/ccg-cvr.bat ================================================ @echo off rem For usage, do: ccg-cvr -h call ccg-env %JAVA_CMD% opennlp.ccg.test.CrossValidateRealizer %* ================================================ FILE: bin/ccg-draw-graph ================================================ #!/bin/sh python "$OPENCCG_HOME/bin/dlf_parser.py" "$@" ================================================ FILE: bin/ccg-draw-graph.bat ================================================ @echo off python %OPENCCG_HOME%/bin/dlf_parser.py %* ================================================ FILE: bin/ccg-draw-tree ================================================ #!/bin/sh python "$OPENCCG_HOME/bin/ccg_draw_tree.py" "$@" ================================================ FILE: bin/ccg-draw-tree.bat ================================================ @echo off python %OPENCCG_HOME%/bin/ccg_draw_tree.py %* ================================================ FILE: bin/ccg-env ================================================ #!/bin/sh # sets OpenCCG environment variables if [ "$JAVA_HOME" = "" ] ; then echo echo "Error: JAVA_HOME not found in your environment." echo echo "Please set the JAVA_HOME variable in your environment to match the" echo "location of the Java Virtual Machine you want to use." exit 1 fi if [ "$OPENCCG_HOME" = "" ] ; then echo echo "Error: OPENCCG_HOME not found in your environment." echo echo "Please set the OPENCCG_HOME variable in your environment to match the" echo "location of your OpenNLP CCG Library distribution." exit 1 fi case `uname` in CYGWIN* ) OPENCCG_HOME="`cygpath -w $OPENCCG_HOME`" ;; esac OPENCCG_LIB="$OPENCCG_HOME/lib" OPENCCG_SRC="$OPENCCG_HOME/src" OPENCCG_CLASSES="$OPENCCG_HOME/output/classes" OPENCCG_JAR="$OPENCCG_HOME/lib/openccg.jar" case `uname` in CYGWIN* ) DIRLIBS="$OPENCCG_LIB/trove.jar;$OPENCCG_LIB/jdom.jar;$OPENCCG_LIB/jline.jar;$OPENCCG_LIB/jopt-simple.jar" CP="${OPENCCG_JAR};${DIRLIBS};." ;; * ) DIRLIBS="$OPENCCG_LIB/trove.jar:$OPENCCG_LIB/jdom.jar:$OPENCCG_LIB/jline.jar:$OPENCCG_LIB/jopt-simple.jar" CP="${OPENCCG_JAR}:${DIRLIBS}:." 
;; esac # variant for use with 'build compile' option, if desired: #CP="${OPENCCG_CLASSES}:${OPENCCG_SRC}:${DIRLIBS}" JAVA="$JAVA_HOME/bin/java" JAVA_MEM="-Xmx256m" #JAVA_MEM="-Xmx2048m" #JAVA_MEM="-Xmx8g" #JAVA_MEM="-Xmx16g" JAVA_ARGS="$JAVA_MEM -classpath $CP -Dfile.encoding=UTF8" ================================================ FILE: bin/ccg-env.bat ================================================ @echo off rem sets OpenCCG environment variables if not exist "%JAVA_HOME%" goto no_JAVA_HOME if not exist "%OPENCCG_HOME%" goto no_OPENCCG_HOME set OPENCCG_LIB=%OPENCCG_HOME%\lib set DIRLIBS=%OPENCCG_LIB%\trove.jar;%OPENCCG_LIB%\jdom.jar;%OPENCCG_LIB%\jline.jar;%OPENCCG_LIB%\jopt-simple.jar set XMLLIBS=%OPENCCG_LIB%\xml-apis.jar;%OPENCCG_LIB%\xercesImpl.jar;%OPENCCG_LIB%\xalan.jar set OPENCCG_SRC=%OPENCCG_HOME%\src set OPENCCG_CLASSES=%OPENCCG_HOME%\output\classes set OPENCCG_JAR=%OPENCCG_HOME%\lib\openccg.jar rem variant without XMLLIBS rem set CP=%OPENCCG_JAR%;%DIRLIBS%;. rem variant with XMLLIBS set CP=%OPENCCG_JAR%;%DIRLIBS%;%XMLLIBS%;. rem variant for use with 'build compile' option, if desired: rem set CP=%OPENCCG_CLASSES%;%OPENCCG_SRC%;%DIRLIBS% set JAVA="%JAVA_HOME%\bin\java" set JAVA_MEM=-Xmx256m rem set JAVA_MEM=-Xmx2048m set JAVA_CMD=%JAVA% %JAVA_MEM% -classpath %CP% -Dfile.encoding=UTF8 goto end :no_JAVA_HOME echo. echo Error: JAVA_HOME not found in your environment. echo. echo Please set the JAVA_HOME variable in your environment to match the echo location of the Java Virtual Machine you want to use. echo. exit /b 1 :no_OPENCCG_HOME echo. echo Error: OPENCCG_HOME not found in your environment. echo. echo Please set the OPENCCG_HOME variable in your environment to match the echo location of your OpenNLP CCG Library distribution. echo. exit /b 1 :end ================================================ FILE: bin/ccg-grammardoc ================================================ #!/bin/sh # # $Id: ccg-grammardoc,v 1.2 2006/12/03 17:14:23 mwhite14850 Exp $ # Script to run grammardoc from the command line. # Author: Scott Martin (http://www.ling.osu.edu/~scott/) # # Usage: ccg-grammardoc [-s|--source sourceDir] [-d|--dest destDir] # . ccg-env ANT_HOME="$OPENCCG_HOME/lib" case `uname` in CYGWIN* ) CP="$CP;$ANT_HOME/ant.jar" ;; * ) CP="$CP:$ANT_HOME/ant.jar" ;; esac JAVA_ARGS="-Xmx128m -classpath $CP" "$JAVA" $JAVA_ARGS opennlp.ccg.grammardoc.GrammarDoc $@ ================================================ FILE: bin/ccg-grammardoc.bat ================================================ @echo off rem Usage: ccg-grammardoc [-s|--source sourceDir] [-d|--dest destDir] call ccg-env set ANT_HOME=%OPENCCG_HOME%\lib set CP=%CP%;%ANT_HOME%\ant.jar set JAVA_ARGS=-Xmx128m -classpath %CP% %JAVA% %JAVA_ARGS% opennlp.ccg.grammardoc.GrammarDoc %* ================================================ FILE: bin/ccg-gt ================================================ #!/bin/sh # For usage, do: ccg-gt -h . ccg-env "$JAVA" $JAVA_ARGS opennlp.ccg.test.GenTargets $@ ================================================ FILE: bin/ccg-gt.bat ================================================ @echo off rem For usage, do: ccg-gt -h call ccg-env %JAVA_CMD% opennlp.ccg.test.GenTargets %* ================================================ FILE: bin/ccg-ht-factors ================================================ #!/bin/sh . 
ccg-env #CP=$CP:$OPENCCG_HOME/lib/jopt-simple.jar #echo $JAVA_ARGS "$JAVA" $JAVA_ARGS opennlp.ccg.realize.hypertagger.LMFactorExtractor $@ ================================================ FILE: bin/ccg-hypertagger ================================================ #!/bin/sh . ccg-env #CP=$CP:$OPENCCG_HOME/lib/jopt-simple.jar #echo $JAVA_ARGS "$JAVA" $JAVA_ARGS opennlp.ccg.realize.hypertagger.TagExtract $@ ================================================ FILE: bin/ccg-hypertagger.bat ================================================ @echo off call ccg-env %JAVA_CMD% opennlp.ccg.realize.hypertagger.TagExtract %* ================================================ FILE: bin/ccg-parse ================================================ #!/bin/sh # Usage: ccg-parse -h . ccg-env "$JAVA" $JAVA_ARGS opennlp.ccg.Parse $@ ================================================ FILE: bin/ccg-parse.bat ================================================ @echo off rem Usage: ccg-parse -h call ccg-env %JAVA_CMD% opennlp.ccg.Parse %1 %2 %3 %4 %5 %6 %7 %8 %9 ================================================ FILE: bin/ccg-postagger ================================================ #!/bin/sh . ccg-env "$JAVA" $JAVA_ARGS opennlp.ccg.parse.postagger.BasicPOSTagger $@ ================================================ FILE: bin/ccg-postagger.bat ================================================ @echo off call ccg-env %JAVA_CMD% opennlp.ccg.parse.postagger.BasicPOSTagger %* ================================================ FILE: bin/ccg-realize ================================================ #!/bin/sh # Usage: ccg-realize (-g ) () . ccg-env "$JAVA" $JAVA_ARGS opennlp.ccg.Realize $@ ================================================ FILE: bin/ccg-realize.bat ================================================ @echo off rem Usage: ccg-realize (-g ) () call ccg-env rem set HPROF=-Xrunhprof:cpu=times,file=hmm-prof.txt %JAVA_CMD% opennlp.ccg.Realize %1 %2 %3 %4 %5 %6 %7 %8 %9 ================================================ FILE: bin/ccg-supertagger ================================================ #!/bin/sh . ccg-env "$JAVA" $JAVA_ARGS opennlp.ccg.parse.supertagger.WordAndPOSDictionaryLabellingStrategy $@ ================================================ FILE: bin/ccg-supertagger.bat ================================================ @echo off call ccg-env %JAVA_CMD% opennlp.ccg.parse.supertagger.WordAndPOSDictionaryLabellingStrategy %* ================================================ FILE: bin/ccg-test ================================================ #!/bin/sh # For usage, do: ccg-test -h . ccg-env "$JAVA" $JAVA_ARGS opennlp.ccg.test.Regression "$@" ================================================ FILE: bin/ccg-test.bat ================================================ @echo off rem For usage, do: ccg-test -h call ccg-env rem set HPROF=-Xrunhprof:cpu=times,file=hmm-prof.txt %JAVA_CMD% opennlp.ccg.test.Regression %* ================================================ FILE: bin/ccg-update ================================================ #!/bin/sh # For usage, do: ccg-update -h . 
ccg-env "$JAVA" $JAVA_ARGS opennlp.ccg.test.UpdateTestbed $@ ================================================ FILE: bin/ccg-update.bat ================================================ @echo off rem For usage, do: ccg-update -h call ccg-env %JAVA_CMD% opennlp.ccg.test.UpdateTestbed %* ================================================ FILE: bin/ccg2xml ================================================ #!/bin/sh python "$OPENCCG_HOME/bin/ccg2xml.py" "$@" ================================================ FILE: bin/ccg2xml.bat ================================================ @echo off python %OPENCCG_HOME%/bin/ccg2xml.py %* ================================================ FILE: bin/ccg_draw_tree.py ================================================ # # ccg_draw_tree uses nltk.Tree to draw a tree from a CCGbank .auto file, # or to draw two trees from two .auto files # import sys if len(sys.argv) == 1 or sys.argv[1] == '-h' or sys.argv[1] == '--help': print 'Usage: ccg_draw_tree () ()' sys.exit(0) autofile = sys.argv[1] deriv_id = sys.argv[2] autofile2 = None deriv_id2 = None if len(sys.argv) >= 4: autofile2 = sys.argv[3] deriv_id2 = deriv_id if len(sys.argv) >= 5: deriv_id2 = sys.argv[4] def get_deriv(autofile, deriv_id): print 'reading ' + deriv_id + ' from ' + autofile found_it = False file = open(autofile, 'rU') for line in file: if found_it == True: return line if line[0:2] == 'ID': if line.split()[0].split('=')[1] == deriv_id: found_it = True raise NameError('could not find ' + deriv_id + '!') deriv = get_deriv(autofile, deriv_id) deriv2 = None if autofile2 != None: deriv2 = get_deriv(autofile2, deriv_id2) print 'importing nltk.Tree' from nltk import Tree from nltk.draw.tree import draw_trees ccgbank_node_pattern = r'' ccgbank_leaf_pattern = r'' # nb: the parens around leaves ends up creating blank nodes above leaves def parse_ccgbank_node(s): if s =='': return '' return s.split(' ')[1] def parse_ccgbank_leaf(s): tokens = s.split(' ') return Tree(tokens[1], [tokens[4]]) def excise_empty_nodes(t): if not isinstance(t,Tree): return t if t.node == '': return excise_empty_nodes(t[0]) return Tree(t.node, [excise_empty_nodes(st) for st in t]) # nb: returns tree with blank nodes excised def parse_ccgbank_tree(s): t = Tree.parse(s, parse_node=parse_ccgbank_node, parse_leaf=parse_ccgbank_leaf, node_pattern=ccgbank_node_pattern, leaf_pattern=ccgbank_leaf_pattern) return excise_empty_nodes(t) print print 'parsing: ' + deriv t = parse_ccgbank_tree(deriv) print t t2 = None if deriv2 != None: print print 'parsing: ' + deriv2 t2 = parse_ccgbank_tree(deriv2) print t2 print if t2 == None: print 'drawing tree' draw_trees(t) else: print 'drawing trees' draw_trees(t,t2) ================================================ FILE: bin/dlf_parser.py ================================================ # # dlf_parser.py (invoked by ccg-draw-graph) uses graphviz's dot to visualize (D)LF graphs # # author: Jonathan Barker (with minor contributions by Michael White) # license: LGPL # from xml.etree.ElementTree import ElementTree import optparse, sys, codecs, xml, os from collections import defaultdict # Parse arguments op = optparse.OptionParser() op.add_option("-i", "--input", type="string", help="input source: file or (default)", default=sys.stdin) op.add_option("-m", "--moses", type="string", help="file/directory prefix for moses output", default=None) op.add_option("-v", "--visualize", type="string", help="file/directory prefix for .pdf output", default=None) op.add_option("-w", "--wordindices", action="store_true", 
help="include word indices", default=False) op.add_option("-c", "--classnames", action="store_true", help="include semantic class names", default=False) (ops, args) = op.parse_args(sys.argv) # Parse input file input_source = ops.input if ops.input is sys.stdin else open(ops.input, "rt") raw = xml.etree.ElementTree.XML(input_source.read()) snum = "None" att_id = 0 # Get word number def wordNum(wid): if wid.startswith("x"): return -1 else: return int(wid[1:].strip("f")) # Get node span def span(nid, graph, w): if wordNum(nid) in w: return [] w.append(wordNum(nid)) for n, e in graph[nid]: if wordNum(n) not in w: w.append(wordNum(n)) w.extend(span(n, graph, w)) return w # findall wrapper def findAll(elem, match): return max(elem.findall(match), []) # Class for representing predicates and attributes class Pred: def __init__(self): self.attrib = [] self.one_of = [] self.opt = [] # Class for representing nodes, contains predicate and attribute information class Node: def __init__(self): self.id = "" self.className = "" self.preds = defaultdict(Pred) def addPred(self, pred, attrib, one_of, opt): self.preds[pred].attrib.extend(attrib) self.preds[pred].one_of.extend(one_of) self.preds[pred].opt.extend(opt) def moses(self, graph): tree = " " return tree def dot(self): dot_node = self.id+" [label=<" withClassName = ops.classnames and len(self.className) > 0 if ops.wordindices: dot_node += self.id if withClassName: dot_node += ":" if withClassName: dot_node += self.className if len(self.preds) > 0: if ops.wordindices or withClassName: dot_node += ":" labels = [] for pname, p in self.preds.items(): label = "" # pred label += ""+pname+"" # att atts = [] if len(p.attrib) > 0: atts.append(",".join(["<"+k.upper()+">"+v for (k, v) in p.attrib])) if len(p.one_of) > 0: atts.append("|".join(["<"+k.upper()+">"+v for (k, v) in p.one_of])) if len(p.opt) > 0: atts.append("("+",".join(["<"+k.upper()+">"+v for (k, v) in p.opt])+")?") if len(atts) > 0: label += ""+",".join(atts)+"" labels.append(label) dot_node += " | ".join(labels) dot_node += ">];\n" return dot_node def info(self): print "Node id:",self.id for pname, p in self.preds: print "\tPred:",self.pred print "\t\tAttrib:",p.attrib print "\t\tOne_of:",p.one_of print "\t\tOpt:",p.opt print "----------------" # Returns just the id, stripping the class (if any) def parseId(str): colonIndex = str.find(":") if colonIndex > 0: return str[:colonIndex] else: return str # Returns the class from the id, or the empty string if none def parseClass(str): colonIndex = str.find(":") if colonIndex > 0: return str[colonIndex+1:] else: return "" # Method for parsing def parseNode(node, graph, nodes): n = nodes[node.get("id")] n.id = parseId(node.get("id")) n.className = parseClass(node.get("id")) attrib = [(k, v) for (k, v) in node.items() if k not in ["id", "pred"]] if node.get("pred") is not None: n.addPred(node.get("pred"), attrib, [], []) nodes[n.id] = n for elem in list(node): if elem.tag == "rel": parseRel(elem, n.id, graph, nodes, "") elif elem.tag == "one-of": parseOneOf(elem, n, attrib, node.get("pred"), graph, nodes) elif elem.tag == "opt": parseOpt(elem, n, graph, nodes) elif elem.tag == "node": parseNode(elem, graph, nodes) else: print snum+": Unexpected tag <"+elem.tag+"> after " quit() # Method for parsing def parseOpt(opt, node, graph, nodes): for elem in list(opt): if elem.tag == "atts": for pname, p in node.preds.items(): node.addPred(pname, [], [], [(k, v) for (k, v) in elem.items() if k not in ["id", "pred"]]) elif elem.tag == "rel": parseRel(elem, node.id, 
graph, nodes, "style=dotted, ") else: print snum+": Unexpected tag <"+elem.tag+"> after " quit() # Method for parsing def parseOneOf(oneof, node, attrib, pred, graph, nodes): global att_id num_att = 0 for elem in list(oneof): if elem.tag == "atts": if pred is not None: node.addPred(pred, [], [(k, v) for (k, v) in elem.items() if k not in ["id", "pred"]], []) else: node.addPred(elem.get("pred"), [], [(k, v) for (k, v) in elem.items() if k not in ["id", "pred"]], []) if len(list(elem)) > 0: num_att += 1 new_att = Node() new_att.id = "att"+str(att_id) att_id += 1 new_att.addPred(str(num_att), [], [], []) nodes[new_att.id] = new_att graph[node.id].append((new_att.id, " [style=dashed];\n")) for rel in list(elem): parseRel(rel, new_att.id, graph, nodes, "") elif elem.tag == "rel": num_att += 1 new_att = Node() new_att.id = "att"+str(att_id) att_id += 1 new_att.addPred(str(num_att), [], [], []) nodes[new_att.id] = new_att graph[node.id].append((new_att.id, " [style=dashed];\n")) parseRel(elem, new_att.id, graph, nodes, "") else: print snum+": Unexpected tag <"+elem.tag+"> after " quit() # Method for parsing def parseRel(rel, nid, graph, nodes, style): # for subnode in list(rel): if subnode.tag == "node": edge_label = " ["+style+"label = \""+rel.get("name")+"\"];\n" if subnode.get("id") is None: graph[nid].append((parseId(subnode.get("idref")), edge_label)) else: graph[nid].append((parseId(subnode.get("id")), edge_label)) parseNode(subnode, graph, nodes) elif subnode.tag == "one-of": subnode.set("name", rel.get("name")) parseRel(subnode, nid, graph, nodes, "style=dashed, ") else: print snum+": Unexpected tag <"+subnode.tag+"> after " quit() # item_no = 0 for item in findAll(raw, "item"): item_no += 1 if item.get("numOfParses") == "0": print "Removing "+item.get("info") else: snum = item.get("info") # lf_num = 0 for lf in findAll(item, "lf"): graph = defaultdict(list) nodes = defaultdict(Node) # for node in list(lf): if node.tag == "node": parseNode(node, graph, nodes) else: print snum+": Unexpected tag <"+node.tag+"> after " quit() # Plot the graph with GraphViz if ops.visualize != None: viz_name = "" if type(item.get("info")) != type("string"): viz_name = ops.visualize+".item"+str(item_no)+"."+str(lf_num) else: viz_name = ops.visualize+"."+item.get("info")+"."+str(lf_num) viz = codecs.open(viz_name+".dot", "w", "utf-8") viz.write("digraph lf {\n") for (k, v) in nodes.items(): viz.write(v.dot()) for (left, rights) in graph.items(): for right in rights: viz.write(left+"->"+right[0]+right[1]) viz.write("}\n") viz.close() os.system("dot -Tpdf "+viz_name+".dot -o "+viz_name+".pdf") os.system("rm "+viz_name+".dot") lf_num += 1 ================================================ FILE: bin/tccg ================================================ #!/bin/sh # For usage, do: tccg -h . 
ccg-env "$JAVA" $JAVA_ARGS opennlp.ccg.TextCCG "$@" ================================================ FILE: bin/tccg.bat ================================================ @echo off rem For usage, do: tccg -h call ccg-env %JAVA_CMD% opennlp.ccg.TextCCG %* ================================================ FILE: bin/visccg ================================================ #!/bin/sh python "$OPENCCG_HOME/bin/ccg_editor.py" "$@" ================================================ FILE: bin/visccg.bat ================================================ @echo off python %OPENCCG_HOME%/bin/ccg_editor.py %* ================================================ FILE: bin/wccg ================================================ #!/bin/sh # For usage, do: tccg -h . ccg-env "$JAVA" $JAVA_ARGS opennlp.ccg.WebCCG "$@" ================================================ FILE: build.xml ================================================ ================================================ FILE: ccg-format-grammars/arabic/arabic.ccg ================================================ ############################################################# # # # arabic.ccg # # # ############################################################# # Author: Ben Wing # Date: April 2006 # This is a grammar for a fragment of Arabic. It's particularly # useful for demonstrating the extended use of macros to handle # complicated morphological inflections. # See the `tiny' grammar (tiny.ccg) for more info about the format # of this file. feature { CASE<2>: nom, acc, gen; NUM<2>: sg, du, pl; GEND<2>: m, f; STATE<2>: cons, non-cons {indef, def}; ANIM<2>: hum, nonhum; PERS<2>: 1st, 2nd, 3rd; RESUMPTIVE<2>: nonres, res; SEM-NUM: sg-X, du-X, pl-X; SEM-PERS: 1st-X, 2nd-X, 3rd-X; TENSE: past, pres; MOOD: indic, subj, juss; # Here's a more complicated hierarchy, from the original tiny grammar. ontology: sem-obj { phys-obj { animate-being { person }, thing }, situation { change { action }, state } }; } rule { no typeraise; typeraise +: n => s; typeraise - $: n => s; typeraise - $: pp => s; typeraise - $: pp/n => s; typechange: s$1 | n[nom] => s$1 ; typechange: n<~2>[cons] => n<2>[3rd,def] /* n[gen,def] ; typechange: n<~2>[cons] => n<2>[3rd,indef] /* n[gen,indef] ; } ########################################################################## # Morphological entries # # (morph.xml) # ########################################################################## word wa:Conj; # "and" word anna:Comp; # "that", introducing sentential complements word inna:Comp; # same, but only after the verb qaal "say" word maa:InterrogPro(thing): 3rd; # "what" word man:InterrogPro(person): 3rd; # "who" word li:Prep; # "what" word fii:Prep; # "who" # This word means "this". word haadhaa { *: sg, m; haadhihi: sg, f; ha_ulaahi: pl; # Bizarrely, this word declines for case only in the dual. haadhaani: du, m, nom; haadhayni: du, m, acc; haadhayni: du, m, gen; haataani: du, f, nom; haatayni: du, f, acc; haatayni: du, f, gen; } # This word means "that". word dhaalik { *: sg, m; tilka: sg, f; ulaa_ika: pl; # Bizarrely, this word declines for case only in the dual. dhaanika: du, m, nom; dhaynika: du, m, acc; dhaynika: du, m, gen; taanika: du, f, nom; taynika: du, f, acc; taynika: du, f, gen; } # This is the relative pronoun. word al-ladhii { *: sg, m; al-latii: sg, f; al-ladhiina: pl, m; al-laati: pl, f; # Bizarrely, this word declines for case only in the dual. 
al-ladhaani: du, m, nom; al-ladhayni: du, m, acc; al-ladhayni: du, m, gen; al-lataani: du, f, nom; al-latayni: du, f, acc; al-latayni: du, f, gen; } word pro:Pro { ana: 1st, 1st-X, sg, sg-X; anta: 2nd, 2nd-X, sg, sg-X, m; anti: 2nd, 2nd-X, sg, sg-X, f; huwa: 3rd, 3rd-X, sg, sg-X, m; hiya: 3rd, 3rd-X, sg, sg-X, f; naHnu: 1st, 1st-X, pl, pl-X; antun: 2nd, 2nd-X, pl, pl-X, m; antunna: 2nd, 2nd-X, pl, pl-X, f; hum: 3rd, 3rd-X, pl, pl-X, m; hunna: 3rd, 3rd-X, pl, pl-X, f; } word ii:: 1st, 1st-X, sg, sg-X; word nii:: 1st, 1st-X, sg, sg-X; word ka:: 2nd, 2nd-X, sg, sg-X, m; word ki:: 2nd, 2nd-X, sg, sg-X, f; word hu:: 3rd, 3rd-X, sg, sg-X, m; word haa:: 3rd, 3rd-X, sg, sg-X, f; word naa:: 1st, 1st-X, pl, pl-X; word kum:: 2nd, 2nd-X, pl, pl-X, m; word kunna:: 2nd, 2nd-X, pl, pl-X, f; word hum:: 3rd, 3rd-X, pl, pl-X, m; word hunna:: 3rd, 3rd-X, pl, pl-X, f; ############################################# # Nouns # ############################################# # This shows how a reasonably complicated morphology can be accommodated. # It is certainly possible that some of this may (and probably should) # be offloaded into a separate morphology-processing engine. However, # even in that case there is often a good deal more to the lexicon. # We show a couple examples of complete paradigms, in order to make it # easier to understand what's going on below. # Here is a typical noun (kitaab "book") with a broken plural (kutub "books"). # For nouns with broken plurals, the plural is typically declined like # the singular. Note that Arabic nouns are conjugated for three numbers # (singular, dual, plural), three cases (nominative, accusative, dative), # and three states (indefinite, definite, construct). (The construct state # is used for nouns that are modified by other nouns -- e.g. "book" in # "the book of Mary".) # Form Nominative Accusative Dative # --------------------------------------------------------------- # sg.indef kitaabun kitaaban kitaabin # sg.def al-kitaabu al-kitaaba al-kitaabi # sg.cons kitaabu kitaaba kitaabi # # du.indef kitaabaani kitaabayni kitaabayni # du.def al-kitaabaani al-kitaabayni al-kitaabayni # du.cons kitaabaa kitaabay kitaabay # # pl.indef kutubun kutuban kutubin # pl.def al-kutubu al-kutuba al-kutubi # pl.cons kutubu kutuba kutubi # Here is a typical noun (mudarris "teacher") with a different kind of # plural, a so-called "strong masculine plural", which has its own declension. # Form Nominative Accusative Dative # --------------------------------------------------------------- # sg.indef mudarrisun mudarrisan mudarrisin # sg.def al-mudarrisu al-mudarrisa al-mudarrisi # sg.cons mudarrisu mudarrisa mudarrisi # # du.indef mudarrisaani mudarrisayni mudarrisayni # du.def al-mudarrisaani al-mudarrisayni al-mudarrisayni # du.cons mudarrisaa mudarrisay mudarrisay # # pl.indef mudarrisuuna mudarrisiina mudarrisiina # pl.def al-mudarrisuuna al-mudarrisiina al-mudarrisiina # pl.cons mudarrisuu mudarrisii mudarrisii # Here, we make heavy use of macros. # This macro says: Every time an expression of the form # three-form-decl(...) occurs, replace it with the text that comes after. # The parameters will be substituted into the text. The braces that # denote the macro's text do *NOT* form part of the text that is substituted. # Note that macro substitutions are processed recursively: If the text # of a macro substitution contains calls to other macros, they will also # be processed. This makes "inheritance" very easy to implement. 
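# To make the mechanism concrete, here is an illustrative, hand-expanded sketch
# (not itself part of the grammar) of what a single macro call turns into, using
# the triptote() and three-form-decl() macros defined just below. A call such as
#
#   triptote(kitaab, sg, sg-X, m)
#
# first rewrites to three-form-decl(kitaab, un, an, in, u, a, i, u, a, i, sg, sg-X, m),
# and after all substitutions it yields morphological entries along the lines of
#
#   kitaab.un: sg, sg-X, m, nom, indef;       # kitaabun
#   kitaab.an: sg, sg-X, m, acc, indef;       # kitaaban
#   add-al(kitaab.u): sg, sg-X, m, nom, def;  # al-kitaabu, once add-al() is expanded in turn
#   kitaab.u: sg, sg-X, m, nom, cons;         # kitaabu
#   ...
#
# which matches the "kitaab" paradigm table shown above.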
# This macro is used for a particular paradigm corresponding to a # particular number of a word. def three-different-form-decl(indef-form, def-form, cons-form, indef-nom, indef-acc, indef-gen, def-nom, def-acc, def-gen, cons-nom, cons-acc, cons-gen, morph-num, sem-num, gend) { indef-form.indef-nom: morph-num, sem-num, gend, nom, indef; indef-form.indef-acc: morph-num, sem-num, gend, acc, indef; indef-form.indef-gen: morph-num, sem-num, gend, gen, indef; add-al(def-form.def-nom): morph-num, sem-num, gend, nom, def; add-al(def-form.def-acc): morph-num, sem-num, gend, acc, def; add-al(def-form.def-gen): morph-num, sem-num, gend, gen, def; cons-form.cons-nom: morph-num, sem-num, gend, nom, cons; cons-form.cons-acc: morph-num, sem-num, gend, acc, cons; cons-form.cons-gen: morph-num, sem-num, gend, gen, cons; } # It's questionable whether we should do this. This assimilates al- # to a following coronal consonant, e.g. ar-rajul, as-sigaara, # ath-thalj, an-nuur, aDH-DHuhr, etc. def add-al(form) regsub('^al-([std]h|DH|[tdszrnTDSZL])', 'a\1-\1', al-.form) def three-form-decl(form, indef-nom, indef-acc, indef-gen, def-nom, def-acc, def-gen, cons-nom, cons-acc, cons-gen, morph-num, sem-num, gend) { three-different-form-decl(form, form, form, indef-nom, indef-acc, indef-gen, def-nom, def-acc, def-gen, cons-nom, cons-acc, cons-gen, morph-num, sem-num, gend) } # Using the above macro, we create two more macros to handle two common # paradigm types: Accusative and genitive are the same, and the # definite is either the same as the construct (two-form-decl-1) or # the same as the indefinite (two-form-decl-2). def two-form-decl-1(form, non-cons-nom, non-cons-obl, cons-nom, cons-obl, morph-num, sem-num, gend) { three-form-decl(form, non-cons-nom, non-cons-obl, non-cons-obl, non-cons-nom, non-cons-obl, non-cons-obl, cons-nom, cons-obl, cons-obl, morph-num, sem-num, gend) } def two-form-decl-2(form, indef-nom, indef-obl, non-indef-nom, non-indef-obl, morph-num, sem-num, gend) { three-form-decl(form, indef-nom, indef-obl, indef-obl, non-indef-nom, non-indef-obl, non-indef-obl, non-indef-nom, non-indef-obl, non-indef-obl, morph-num, sem-num, gend) } # In turn we create macros for particular paradigms: strong masculine ("uun"), # strong feminine ("aat"), dual, and basic triptote (the paradigm for # "kitaab" above and, in general, most singulars). # Note that an alternative to using braces is to put the macro text on # the same line as the `def' part of the macro (backslashes can be used # to join multiple lines together). def uun-plural(form) two-form-decl-1(form, uuna, iina, uu, ii, pl, pl-X, m) def aat-plural(form) \ two-form-decl-2(form, aatun, aatin, aatu, aati, pl, pl-X, f) def dual(form, gend) \ two-form-decl-1(form, aani, ayni, aa, ay, du, du-X, gend) def triptote(form, morph-num, sem-num, gend) \ three-form-decl(form, un, an, in, u, a, i, u, a, i, morph-num, sem-num, gend) # Here we define macros for full paradigms for words. Note how semicolons # are not used, because they are supplied by the macro text itself. # (Consult the text for three-form-decl() above, and remember that the # braces denoting the macro text are not actually part of the text. This # means that if you really want braces as the outermost thing in some # macro text, you'll need to supply two levels of braces.) 
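# (A hypothetical illustration of that last point: with
#
#   def braced(x) {{ x }}
#
# the macro text is "{ x }", so braced(a) expands to "{ a }" -- only the
# outermost pair of braces is stripped.)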
def thing(sing, plur) { word sing:N(thing) { triptote(sing, sg, sg-X, m) dual(sing, m) triptote(plur, sg, pl-X, f) } } def fem-thing(sing, plur) { word sing:N(thing) { triptote(sing.t, sg, sg-X, f) dual(sing.t, f) triptote(plur, sg, pl-X, f) } } def person(sing, plur, gend) { word sing:N(person) { triptote(sing, sg, sg-X, gend) dual(sing, gend) triptote(plur, pl, pl-X, gend) } } def male(sing, plur) person(sing, plur, m) def female(sing, plur) person(sing, plur, f) def strong-male(sing) { word sing:N(person) { triptote(sing, sg, sg-X, m) dual(sing, m) uun-plural(sing) } } # Here we define the actual words. Note how short these definitions are, # specifying only what's unpredictable. thing(kitaab, kutub) thing(waqt, _awqaat) thing(Harf, Huruuf) thing(dars, duruus) thing(waqt, _awqaat) fem-thing(sigaara, sagaayir) fem-thing(madiina, mudun) male(rajul, rijaal) male(walad, _awlaad) male(Taalib, Tullaab) female(bint, _abnaat) strong-male(mudarris) word imra_a:N(person) { three-different-form-decl(imra_at, mar_at, imra_at, un, an, in, u, a, i, u, a, i, sg, sg-X, f) three-different-form-decl(imra_at, mar_at, imra_at, aani, ayni, ayni, aani, ayni, ayni, aa, ay, ay, du, du-X, f) triptote(nisaa_, pl, pl-X, f) } def extended_construct_word(stem, plur) { word stem:N(person) { three-form-decl(stem, un, an, in, u, a, i, uu, aa, ii, sg, sg-X, m) dual(stem, m) triptote(plur, pl, pl-X, m) } } extended_construct_word(_ax, _ixwaan) extended_construct_word(_ab, _abnaa_) # Typical paradigms: # 1sg 'aktaa 'aktaa 'akta | # 2sg.m taktaa taktaa takta | # 2sg.f taktayna taktay taktay | # 3sg.m yaktaa yaktaa yakta | # 3sg.f taktaa taktaa takta | # 2du taktayaani taktayaa taktayaa | # 3du.m yaktayaani yaktayaa yaktayaa | # 3du.f taktayaani taktayaa taktayaa | # 1pl naktaa naktaa nakta | # 2pl.m taktawna taktaw taktaw | # 2pl.f taktayna taktayna taktayna | # 3pl.m yaktawna yaktaw yaktaw | # 3pl.f yaktayna yaktayna yaktayna | # # 1sg 'aktuu 'aktuwa 'aktu | 'aktii 'aktiya 'akti # 2sg.m taktuu taktuwa taktu | taktii taktiya takti # 2sg.f taktiina taktii taktii | taktiina taktii taktii # 3sg.m yaktuu yaktuwa yaktu | yaktii yaktiya yakti # 3sg.f taktuu taktuwa taktu | taktii taktiya takti # 2du taktuwaani taktuwaa taktuwaa | taktiyaani taktiyaa taktiyaa # 3du.m yaktuwaani yaktuwaa yaktuwaa | yaktiyaani yaktiyaa yaktiyaa # 3du.f taktuwaani taktuwaa taktuwaa | taktiyaani taktiyaa taktiyaa # 1pl naktuu naktuwa naktu | naktii naktiya nakti # 2pl.m taktuuna taktuu taktuu | taktuuna taktuu taktuu # 2pl.f taktuuna taktuuna taktuuna | taktiina taktiina taktiina # 3pl.m yaktuuna yaktuu yaktuu | yaktuuna yaktuu yaktuu # 3pl.f yaktuuna yaktuuna yaktuuna | yaktiina yaktiina yaktiina def two-form-past(formv, formc) { formc.tu: past, 1st, sg; formc.ta: past, 2nd, m, sg; formc.ti: past, 2nd, f, sg; formv.a: past, 3rd, m, sg; formv.at: past, 3rd, f, sg; formc.tumaa: past, 2nd, du; formv.aa: past, 3rd, m, du; formv.ataa: past, 3rd, f, du; formc.naa: past, 1st, pl; formc.tum: past, 2nd, m, pl; formc.tunna: past, 2nd, f, pl; formv.uu: past, 3rd, m, pl; formc.na: past, 3rd, f, pl; } def 3rd-weak-past-ay(form) { form.ay.tu: past, 1st, sg; form.ay.ta: past, 2nd, m, sg; form.ay.ti: past, 2nd, f, sg; form.aa: past, 3rd, m, sg; form.at: past, 3rd, f, sg; form.ay.tumaa: past, 2nd, du; form.ay.aa: past, 3rd, m, du; form.ataa: past, 3rd, f, du; form.ay.naa: past, 1st, pl; form.ay.tum: past, 2nd, m, pl; form.ay.tunna: past, 2nd, f, pl; form.aw: past, 3rd, m, pl; form.ay.na: past, 3rd, f, pl; } def 3rd-weak-past-aw(form) { form.aw.tu: past, 1st, sg; 
form.aw.ta: past, 2nd, m, sg; form.aw.ti: past, 2nd, f, sg; form.aa: past, 3rd, m, sg; form.at: past, 3rd, f, sg; form.aw.tumaa: past, 2nd, du; form.aw.aa: past, 3rd, m, du; form.ataa: past, 3rd, f, du; form.aw.naa: past, 1st, pl; form.aw.tum: past, 2nd, m, pl; form.aw.tunna: past, 2nd, f, pl; form.aw: past, 3rd, m, pl; form.aw.na: past, 3rd, f, pl; } def 3rd-weak-past-ii(form) { form.ii.tu: past, 1st, sg; form.ii.ta: past, 2nd, m, sg; form.ii.ti: past, 2nd, f, sg; form.iya: past, 3rd, m, sg; form.iyat: past, 3rd, f, sg; form.ii.tumaa: past, 2nd, du; form.iy.aa: past, 3rd, m, du; form.iy.ataa: past, 3rd, f, du; form.ii.naa: past, 1st, pl; form.ii.tum: past, 2nd, m, pl; form.ii.tunna: past, 2nd, f, pl; form.uu: past, 3rd, m, pl; form.ii.na: past, 3rd, f, pl; } def strong-past(form) two-form-past(form, form) # In general, almost all Arabic present-tense verbs of a particular mood # can be defined using five forms. Verbs with a hamza in the first radical # have a problem in the first-singular; ideally this should be handled # automatically using a regexp or something of that sort, but we don't have # such support currently, so we use an optional param. def gen-pres(mood, fsing, fsing-fem, fdual, fplur-masc, fplur-fem) { # This shows how you can use regular expressions if need be. # regsub(string, regex, repl) is a special built-in that does regular- # expression substitution on STRING, replacing all occurrences of # REGEX with REPL. Regular-expression syntax is as in Python. # In this case, Arabic verbs have a phonetic rule that eliminates # two glottal stops occurring near each other at the beginning of a # word. For example, _a_kulu -> _aakulu, and _u_kalu -> _uukalu. # (That is, the vowel is lengthened.) # _ . regsub(foo, bar, fsing): pres, mood, 1st, sg; _ . regsub('^([aiu])_', '\1\1', fsing): pres, mood, 1st, sg; # _.fsing: pres, mood, 1st, sg; t.fsing: pres, mood, 2nd, m, sg; t.fsing-fem: pres, mood, 2nd, f, sg; y.fsing: pres, mood, 3rd, m, sg; t.fsing: pres, mood, 3rd, f, sg; t.fdual: pres, mood, 2nd, du; y.fdual: pres, mood, 3rd, m, du; t.fdual: pres, mood, 3rd, f, du; n.fsing: pres, mood, 1st, pl; t.fplur-masc: pres, mood, 2nd, m, pl; t.fplur-fem: pres, mood, 2nd, f, pl; y.fplur-masc: pres, mood, 3rd, m, pl; y.fplur-fem: pres, mood, 3rd, f, pl; } # The "two-form" present uses normal (non-3rd-weak) endings but may # have two forms of the root, one form vocalic endings (almost all of them) # and one for consonant endings (only the feminine plural). This # encompasses 2nd-weak verbs and doubled verbs, and (trivially) strong verbs. def two-form-pres-indic(formv, formc) { gen-pres(indic, formv.u, formv.iina, formv.aani, formv.uuna, formc.na) } def two-form-pres-subj(formv, formc) { gen-pres(subj, formv.a, formv.ii, formv.aa, formv.uu, formc.na) } # The jussive is different because the base form (fsing) has no ending. # This means that it may assume the consonant form instead of the vowel # form, or may have a number of variants (in particular, for doubled # verbs). So the base form needs to be given explicitly. 
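# (Reading off the definitions below: 2nd-weak-pres() passes the
# consonant-form stem as the jussive base, so for kaan -- present stems
# akuun/akun -- the 3sg.m comes out as indicative yakuunu but jussive yakun,
# with no ending on the base form.)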
def two-form-pres-juss(base, formv, formc) { gen-pres(juss, base, formv.ii, formv.aa, formv.uu, formc.na) } def strong-pres(form) { two-form-pres-indic(form, form) two-form-pres-subj(form, form) two-form-pres-juss(form, form, form) } def 2nd-weak-pres(formv, formc) { two-form-pres-indic(formv, formc) two-form-pres-subj(formv, formc) two-form-pres-juss(formc, formv, formc) } def doubled-pres(formv, formc) { two-form-pres-indic(formv, formc) two-form-pres-subj(formv, formc) two-form-pres-juss(formc, formv, formc) two-form-pres-juss(formv.a, formv, formc) two-form-pres-juss(formv.i, formv, formc) } # Verbs whose third radical is a /w/ or a /y/ have all manner of exceptional # forms; easiest just to list them. In general, there are three types, # depending on whether the base singular forms end in -aa, -ii, or -uu. def 3rd-weak-pres-aa(form) { gen-pres(indic, form.aa, form.ayna, form.ayaani, form.awna, form.ayna) gen-pres(subj, form.aa, form.ay, form.ayaa, form.aw, form.ayna) # Note the shortened vowel here. gen-pres(juss, form.a, form.ay, form.ayaa, form.aw, form.ayna) } def 3rd-weak-pres-ii(form) { gen-pres(indic, form.ii, form.iina, form.iyaani, form.uuna, form.iina) gen-pres(subj, form.iya, form.ii, form.iyaa, form.uu, form.iina) # Note the shortened vowel here. gen-pres(juss, form.i, form.ii, form.iyaa, form.uu, form.iina) } def 3rd-weak-pres-uu(form) { gen-pres(indic, form.uu, form.iina, form.uwaani, form.uuna, form.uuna) gen-pres(subj, form.uwa, form.ii, form.uwaa, form.uu, form.uuna) # Note the shortened vowel here. gen-pres(juss, form.u, form.ii, form.uwaa, form.uu, form.uuna) } def 2nd-weak-verb(pastv, props, pastc, presv, presc) { word pastv: props { two-form-past(pastv, pastc) 2nd-weak-pres(presv, presc) } } # Note the way that macro calls can be constructed as well. Here, the # value of PAST_TYPE is the suffix at the end of the macro name. def 3rd-weak-verb(past_stem, props, past_type, pres_stem, pres_type) { word past_stem . past_type: props { 3rd-weak-past- . past_type(past_stem) 3rd-weak-pres- . pres_type(pres_stem) } } def strong-verb(past, props, pres) { word past: props { strong-past(past) strong-pres(pres) } } 2nd-weak-verb(kaan, TransV(pred=be), kun, akuun, akun) 2nd-weak-verb(naam, IntransV(pred=sleep), nim, anaam, anam) 2nd-weak-verb(qaal, SayV(pred=say), qul, aquul, aqul) strong-verb(katab, TransV(pred=write), aktub) strong-verb(dhahab, IntransV(pred=go), adhhab) # Note that the following verb, which begins with a glottal stop, # will have a modification made to it in the first-person singular present. # (See above.) 
strong-verb(_akal, IntransV TransV (pred=eat), a_kul) 3rd-weak-verb(ra_, TransV(pred=see), ay, ar, aa) 3rd-weak-verb(_a9T, DitransV(pred=give), ay, u9T, ii) 3rd-weak-verb(laq, TransV(pred=find), ii, alq, aa) strong-verb(9araf, ThinkV(pred=know), a9rif) # see also 9alam strong-verb(tafakkar, ThinkV(pred=think), atafakkar) strong-verb(ta9allam, ThinkV(pred=learn), ata9allam) family N { entry: n<2>[X, 3rd, nonres]: X:sem-obj(*); } family InterrogPro(Pro) { entry: s/*(s/n<2>[res]); entry: s/*(s|n<2>[nonres,nom]); entry: s/*(s/n<2>[nonres,acc]); member: maa, man; } family Pro { entry: n<2>[X, nom, def, nonres]: X:sem-obj(*); member: pro; } family Rel { entry: (n<~2>[CASE,nonres]\n<~2>[nonres])/*(s/n<2>[res]); entry: (n<~2>[CASE,nonres]\n<~2>[nonres])/*(s|n<2>[nonres,nom]); entry: (n<~2>[CASE,nonres]\n<~2>[nonres])/*(s/n<2>[nonres,acc]); member: al-ladhii; } family AndConj(Conj) { entry: n[pl, CASE, STATE] \* n[CASE, STATE] /* n[CASE, STATE]; entry: s$1 \* s$1 /* s$1; member: wa; } family Det(indexRel=det) { entry: n<2>[X, def, nonres] /^ n<2>[X]: X:sem-obj(*); member: haadhaa, dhaalik; } # good luck on this one! construct even more complicated ones! # #ar-rajulu al-ladhii kataba al-kutuba ra_aa wa _a9Taa li binti hu al-kilaaba al-latii akalat sagaayira mudarrisii al-waladi #"the man that wrote the books saw and gave to his daughter the dogs that ate the cigarettes of the boy's teachers." # Works, correctly: #ar-rajulu al-ladhii kataba al-kutuba ra_aa wa _a9Taa li binti hu as-sagaayira al-latii qultu inna al-waladu tafakkara anna al-mar_atu _a9Tat haa li ha_ulaahi al-mudarrisiina #Bad #ar-rajula al-ladhii katabat al-kutuba ra_aa wa _a9Taa li binti hu as-sagaayira al-latii qultu inna al-waladu tafakkara anna al-mar_atu _a9Tat haa li ha_ulaahi al-mudarrisiina #"the man that wrote the books saw and gave to his daughter the cigarettes that I said that the boy thought that the woman gave them to those teachers" # Fails, correctly: #ar-rajulu al-ladhii kataba al-kutuba ra_aa wa _a9Taa li binti hu as-sagaayira al-latii qultu inna al-waladu tafakkara anna al-mar_atu _a9Tat hu li ha-ulaahi al-mudarrisiina # Works: # ar-rajulu al-ladhii al-waladu _a9Taa as-sagaayira li binti hu dhahaba # ar-rajulu _a9Taa li binti hu as-sagaayira # ar-rajulu al-ladhii waladu hu _a9Taa as-sagaayira li al-binti dhahaba # Won't work: # ar-rajulu al-ladhii al-waladu _a9Taa li binti hu as-sagaayira dhahaba # ar-rajulu al-ladhii waladu hu _a9Taa li al-binti as-sagaayira dhahaba family PossClitic(Cli, indexRel=poss) { entry: n<~1>[X, def, nonres] \* n<1>[X, cons]: X:sem-obj(*); entry: (n<~1>[X, def, nonres] / n<2>[res]) \* n<1>[X, cons]: X:sem-obj(*); member: ii, ka, ki, hu, haa, naa, kum, kunna, hum, hunna; } family ObjClitic(Cli, indexRel=poss) { entry: (s$1 | n<3>[nonres]) \ (s$1 / n<2>[nonres] | n<3>[nom,nonres]); entry: (s$1 / n<~2>[res] | n<3>[nonres]) \ (s$1 / n<2>[nonres] | n<3>[nom,nonres]); member: nii, ka, ki, hu, haa, naa, kum, kunna, hum, hunna; } family Adj(indexRel=adj) { entry: n<2>[X, NUM, GEND, CASE, STATE] \ n<2>[X]: X:sem-obj(*); } family Prep-Nom(Prep, indexRel="*NoSem*") { # The pp<~3> notation generates an 'inheritsFrom' tag rather than # an 'id' tag for the feature structure. 
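# (As explained at more length in tiny.ccg, [lex=*] attaches a 'lex' feature
# whose value is the word stem; this is what lets DitransV below select a
# pp[lex=li] argument, and SayV/ThinkV select sbar[lex=inna] and
# sbar[lex=anna].)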
entry: pp<~3>[lex=*] /< n<3>[gen,nonres]; member: li, fii; } family Comp(indexRel="*NoSem*") { entry: sbar<~1>[lex=*] / s<1>; member: anna, inna; } family IntransV(V) { entry: s[E] | n<2>[X,NUM,PERS,GEND,non-cons,nonres,nom]: E:action(* ^ X:animate-being); } family SayV(V) { entry: s[E] / sbar[Z, lex=inna] | n<2>[X,NUM,PERS,GEND,non-cons,nonres,nom]: E:action(* ^ X:animate-being ^ Z); } family ThinkV(V) { entry: s[E] / sbar[Z, lex=anna] | n<2>[X,NUM,PERS,GEND,non-cons,nonres,nom]: E:action(* ^ X:animate-being ^ Z); } family TransV(V) { entry: s[E] / n[Y,acc,nonres] | n<2>[X,NUM,PERS,GEND,non-cons,nonres,nom]: E:action(* ^ X:animate-being ^ Y:sem-obj); } family DitransV(V) { # The first slash (on the pp) is marked with a mode allowing backward xcomp. entry: s[E] /< pp[Z,lex=li] / n[Y,acc,nonres] | n<2>[X,NUM,PERS,GEND,non-cons,nonres,nom]: E:action(* ^ X:animate-being ^ Y:sem-obj ^ Z:animate-being) ; } testbed { # different states of subject rajulun dhahaba: 1; ar-rajulu dhahaba: 1; rajulu dhahaba: 0; # subject-verb agreement rajulun dhahabuu: 0; ar-rajulu dhahabuu: 0; rajulu dhahabuu: 0; # gender agreement ar-rajulu dhahaba: 1; ar-rajulu dhahabat: 0; al-bintu dhahaba: 0; al-bintu dhahabat: 1; # possession rajulun hu dhahaba: 0; ar-rajulu hu dhahaba: 0; rajulu hu dhahaba: 1; # subject case ar-rajula dhahaba: 0; ar-rajuli dhahaba: 0; # case in construct phrase _axuu ar-rajuli dhahaba: 1; _axuu ar-rajula dhahaba: 0; _axuu ar-rajulu dhahaba: 0; # construct state in construct phrase _axun ar-rajuli dhahaba: 0; al-_axu ar-rajuli dhahaba: 0; # object case ar-rajulu ra_aa al-kitaaba: 1; ar-rajulu ra_aa al-kitaabi: 0; ar-rajulu ra_aa al-kitaabu: 0; # preposition case ar-rajulu _a9Taa al-kitaaba li al-waladi: 1; ar-rajulu _a9Taa al-kitaaba li al-waladu: 0; ar-rajulu _a9Taa al-kitaaba li al-walada: 0; # subcategorization ar-rajulu ra_aa al-kitaaba li al-waladi: 0; # backward xcomp ar-rajulu _a9Taa li al-waladi al-kitaaba: 1; _a9Taa ar-rajulu li al-waladi al-kitaaba: 1; # object clitics ana ra_aytu hu: 1; ra_aytu hu ana: 1; ra_aytu ana hu: 0; hu ra_aytu ana: 0; hu ana ra_aytu: 0; huwa ra_aa nii: 1; huwa ra_aa ii: 0; huwa ra_aa ana: 0; ar-rajulu _a9Taa haa li al-waladi: 1; _a9Taa haa ar-rajulu li al-waladi: 1; # relative clauses # "I gave it to the man that the girl saw him" _a9Taytu haa li ar-rajuli al-ladhii al-bintu ra_at hu: 3; # "I gave it to the man that the girl saw her" _a9Taytu haa li ar-rajuli al-ladhii al-bintu ra_at haa: 0; # "I gave it to the man that the girl saw" _a9Taytu haa li ar-rajuli al-ladhii al-bintu ra_at: 0; # "I gave it to the man that the girl saw the boy" _a9Taytu haa li ar-rajuli al-ladhii al-bintu ra_at al-walada: 0; } ================================================ FILE: ccg-format-grammars/inherit/inherit.ccg ================================================ # A minimal grammar which shows inheritance. 
# Jason Baldridge, September 2007 ################## Features ################# feature { case: nom acc; } ################## Words ################# word John:NP (pred=john); word Fido:NP (pred=fido); word food:NP (pred=food); word to:PP; word sleeps:IntransV (pred=sleep); word saw:TransV (pred=see); word gave:DitransV (pred=give); ################## Categories ################# family NP { entry: np[X]:X(*); } family PP { entry: pp[X]/np[X]:X(*); } def iv_cat (PostSyn, MoreSem) { s[E] \ np[X nom] PostSyn: E(* X MoreSem) } def tv_cat (PreSyn, PostSyn, MoreSem) { iv_cat(PreSyn / np[Y acc] PostSyn, Y MoreSem) } family IntransV(V) { entry: iv_cat(,); } family TransV(V) { entry: tv_cat(,,); } family DitransV(V) { entry: tv_cat( , / np[Z acc] , Z); entry: tv_cat(/ pp[Z acc] , , Z); } ################## Test sentences ################# testbed { John sleeps: 1; John saw Fido: 1; John gave Fido food: 1; John gave food to Fido: 1; } ================================================ FILE: ccg-format-grammars/tiny/tiny.ccg ================================================ ############################################################# # # # tiny.ccg # # # ############################################################# # Author: Ben Wing # Date: April 2006 # This is derived from Geert-Jan M. Kruijff's 'coordination' grammar, # which was simplified, revised and extended. # # David Reitter, dreitter at inf.ed.ac dot uk, 01/2005 # Michael White, mwhite at inf dot ed.ac.uk, 01/2005 # This is the `tiny' grammar, in .ccg format. There are a bunch # of comments below to explain the format. See also the `arabic' # grammar for an example of extended macro use to handle a complex # morphology. # To generate a grammar for use with OpenCCG, use `genccg' (or whatever # it's currently called). This generates the various XML files needed for # OpenCCG (grammar.xml, lexicon.xml, morph.xml, types.xml, and rules.xml). # After doing this, you can run `tccg' to load the grammar and use it for # parsing. # Some general notes about this format: # -- The general feel of the syntax is like C, Java or Perl. Indentation # and whitespace is unimportant. (The only exception is in macro # definitions, where the text of a macro must either be on the same line # as the definition -- possibly extended with backslash # line-continuation markers -- or be enclosed in braces.) # # -- The syntax tries to be very forgiving of the usage of commas and # semicolons, for the benefit of macro definitions. In most lists, in # fact, commas are optional -- arguments can be separated by no commas, # one comma, or many commas, and extra commas can occur at the end of # the list. All of this makes macro definitions and macro calls much # easier. We usually write such lists below without commas. # # The main exception where commas matter is in macro calls. You can # still put an extra comma at the end of a macro call, but otherwise you # must have exactly one comma (no more, no less) between arguments. The # reason is that macro arguments can contain pretty much any text # whatsoever (including no text at all), so commas are needed to # indicate where one argument stops and the next one starts. # # NOTE: The parser pays attention to parens, brackets, and braces in the # text of a macro call argument, and will not get confused by commas # inside of matched delimiters. 
Thus, a macro call `foo(a, bar(b, c))' # is correctly interpreted as a call to foo() with two arguments, `a' # and `bar(b, c)', and *NOT* a call to foo() with three arguments `a', # `bar(b', and `c)'.) # # Note also how the text of macro definitions and calls can optionally # be surrounded by braces, to clearly delimit the text boundaries (see # below). It's important to note that the braces do *NOT* form part of # the text itself; if you really want your text surrounded by braces, # you need to add a second set around the text. # # -- You can use the `-t' option to see what things look like after macro # substitutions have been applied. # # -- The order of declarations in this file is not significant except # that macros and features must be defined before they can be used. # # -- You can surround literal text (word stems, inflections, etc.) with # single or double quotes in order to insert characters into the text # that would otherwise be interpreted by the parser, such as spaces, # colons, etc. Without such quotes, the only characters that can occur # in a word are letters, numbers, '_', '-', '+' and '%'. Note, however, # that there is no such thing as "reserved words" in this format; words # like 'feature', 'word', 'entry', etc. that have a special significance # in the right place in the syntax can otherwise be freely used as word # stems and inflections, macro variable names, part of speech tags, etc. ############################################################# # # # FEATURES # # # ############################################################# # Declaration of features. This is used as follows: # # (1) So that you can just specify a feature value inside brackets below, # and the appropriate feature is substituted. That is, a declaration # like n[nom] is equivalent to n[CASE=nom]. # # (2) To specify the types listed in types.xml. # # (3) To specify the feature values used in word declarations. These # compile out into declarations in morph.xml (unrelated to # our own use of macros). In order for this to happen, however, you # *must* specify a "macro-tie", inside of parentheses after the feature # type. This is either a number (for a syntactic macro) or a letter # (for a semantic macro). See below for exactly how these are used. # # (A "strict feature" mode may be implemented at some point, where all # features that are used in category definitions must be declared.) feature { # A number following the feature type, as follows, is used for syntactic # features that can be attached to a word. The number is a feature- # structure ID; when an atomic category in a lexical category definition # has the corresponding ID, these features will be inserted into that # category. Hence, the <2> here corresponds to the <2> that occurs # below in the definition of Noun, Det, verbcat(), etc. CASE<2>: nom acc; NUM<2>: sg pl; # You can specify more than one number if you want. # NUM<2,3>: sg pl; # A word in place of a number causes semantic macros to be created; if # used in a word {} declaration, the relevant info will be inserted into # the hybrid logic part of a lexical category declaration, attached to # the argument of the given name. A declaration like (X:NUM) means that # 'NUM' is used in the XML declaration in place of # the feature's actual name. (FIXME: I don't know what the significance # of this is.) sem-num: sg-X pl-X; TENSE: past pres; # You can create hierarchical values as shown. 
PERS<2>: non-3rd {1st 2nd} 3rd; # Alternatively, you can explicitly list the parent(s) of a feature -- # e.g. to create multiple-inheritance hierarchies. #alternate-pers<2>: non-3rd 1st[non-3rd] 2nd[non-3rd] 3rd; # Here's a more complicated hierarchy, from the original tiny grammar. ontology: sem-obj { phys-obj { animate-being { person } thing } situation { change { action } state } }; # Here we show how you can mix the two ways of declaring hierarchies, # if you have a primarily single-inheritance hierarchy but with certain # multiply-inherited values. In this hierarchy, 'werewolf' gets both # 'man' and 'wolf' as its parents. 'intersex' will have only 'man' and # 'woman' as parents -- 'rational-being' will not be specified as it's # redundant. entity: being { # We would call this `thing' but that is used above in # the `ontology' hierarchy, and causes a warning to be issued thing2 animate { irrational-being { fish mammal { dog-like {dog wolf} cat horse } } rational-being { man { centaur[horse] werewolf[wolf] } woman { mermaid[fish] } intersex[man woman] } } } nothingness; } # You can also specify that a feature is "distributive" and/or give # licensing information for the realizer. # # Here's the equivalent of the stuff in flights/lexicon.xml and # flights/types.xml. # # A ! before a feature makes it distributive. You can specify # licensing-related attributes on either a feature or a feature-value, in # the standard way of specifying attributes in .ccg format. feature { !owner(location=args-only, instantiate=false); !info; form: dcl-base {dcl, fronted}, q-base {q(license-marked-cats=true, also-licensed-by=q-base), wh(license-marked-cats=true, also-licensed-by=q-base)}, base, emb(location=target-only), inf(location=target-only), adj(location=target-only), ng; } # If you really want the feature value as used in the word {} declarations # to be different from the feature value elsewhere, you can do that. # This allows you to generate the following XML: # # # # # # # # # # # # # # #feature { # case<0>: acc0:p-case; # case<1>: acc1:p-case; # case<2>: acc2:p-case; # case<3>: acc3:p-case; #} # NOTE: (1) This doesn't quite work in ccg2xml yet, since only `acc3' gets # added to the hierarchy in types.xml. (2) The entire motivation for doing # this kind of thing is kludgy, and will be eliminated by allowing features # to be explicitly specified for the result of a lexical insertion rule, # much like the way that type-raising rules currently work. # Here's how you specify a relation-sorting order, in case you care. relation-sorting: foo * bar baz; ############################################################# # # # WORDS # # # ############################################################# # ################## Functional words ################# # # Some examples of words. # # The format of word declarations is # # word STEM:FAMILY ...(ATTRS): FEATURES; # # or # # word STEM:FAMILY ...(ATTRS) { INFLECTED-FORM: FEATURES; ...} # # where STEM is the word's stem, FAMILY is a list of the families that a # word is part of, and ATTRS specifies any other attributes associated # with the word. FEATURES gives the word's features; these come from the # feature {} declarations above. (NOTE: Only feature values whose features # specify a "macro-tie" value -- something in <> following the # feature's name -- can be used. See above.) # # ATTRS is a list; each attribute is either a specification ATTRIBUTE=VALUE # or a single VALUE (equivalent to class=VALUE). 
The useful attributes are # # class Semantic class of a word. # pred Semantic predicate of a word, used in the logical form; # if omitted, defaults to the word's stem. # excluded List of excluded lexical categories. # coart Boolean indicating that this entry is a coarticulation, # eg a pitch accent, gesture, or other word-associated element. # # Any of FAMILY, ATTRS and/or FEATURES can be omitted. # # The second form above, with braces, is used for words with different # inflections. Instead of specifying the features directly after the word, # you list the features for each inflection separately. Note that * is # shorthand for the stem itself. # # Note that there can be more than one word {} declaration for a single stem. # # The families in FAMILY can be either a family name, from a family {} # block, or a part of speech. (`genccg' will derive the appropriate parts # of speech from any families given when creating the XML file.) Note that # the words associated with a particular family can be specified either by # tagging each word with its family, by listing a family's words explicitly # using the `member' declaration inside of a family {} block, or by a # combination of the two. word the:Det; word some:Det; word a:Det: sg; word for; word pro1:Pro(animate-being) { I: 1st sg nom sg-X; me: 1st sg acc sg-X; we: 1st pl nom pl-X; us: 1st pl acc pl-X; } word pro2:Pro(animate-being) { you: 2nd; } word pro3f:Pro(animate-being) { she: 3rd sg nom sg-X; her: 3rd sg acc sg-X; } word pro3m:Pro(animate-being) { he: 3rd sg nom sg-X; him: 3rd sg acc sg-X; } word pro3n:Pro(thing) { it: 3rd sg sg-X; } # If we want the CLASS associated with only some of the inflections, # we can use the same stem in more than one decl. (Assigning neuter to # "they" is strange but that's how the original morph.xml did it!) word pro3n:Pro { they: 3rd pl nom pl-X; them: 3rd pl acc pl-X; } # ################## Nouns ################# # # Here, we make use of macros. The basic idea behind macros is simple: # They simply do string substitution. However, parameters can be given, # making them very powerful. # This macro says: Every time an expression of the form basic-noun(...) # occurs, replace it with the text that comes after. The parameters will # be substituted into the text. The braces that denote the macro's text do # *NOT* form part of the text that is substituted. (Alternatively, you # can put the entire replacement text on the same line as the macro # definition, using a backslash at the end of the line if needed in order # to continue the definition on the next line.) Likewise, braces can be # used to surround text in an argument to a macro call and will not form of # the argument's text. This is useful when the argument's text contains # commas. In either case, if you really want the text itself to have # braces around it, you need to put two sets of braces around it. # Note that macro substitutions are processed recursively: If the # text of a macro substitution contains calls to other macros, they will # also be processed. This makes "inheritance" very easy to implement. # Inside of a macro definition's text, the . operator can be used; this # concatenates two words together into a single word. See the definition # of normal-noun() below for a simple example. # Substitution of arguments does not occur inside of quoted text. def basic-noun(sing, plur, class) { word sing:N(class) { *: sg sg-X; plur: pl pl-X; } } #def normal-noun(stem, class) { # word stem:N(class) { # *: sg sg-X; # stem . 
s: pl pl-X; # } #} # or equivalently, using our definition of basic-noun(): # def normal-noun(stem, class) basic-noun(stem, stem . s, class) # But in fact, we do something more clever to handle pluralization. # Here we make use of some built-in macros(): # # regsub(PATTERN, REPLACEMENT, TEXT): # Replace all occurrences of regexp PATTERN with REPLACEMENT in TEXT. # This follows normal Python conventions for regular expression # substitution. # # ifmatch(PATTERN, TEXT, IF-TEXT, ELSE-TEXT): # If TEXT matches PATTERN at its beginning, substitute IF-TEXT; else, # substitute ELSE-TEXT. # # ifmatch-nocase(PATTERN, TEXT, IF-TEXT, ELSE-TEXT): # Just like ifmatch() but its pattern-matching is case-insensitive. def pluralize(word) { # This shows a complicated expression involving the built-ins # 'ifmatch' and 'regsub'. If the word ends in a vowel + o or y, # we add s. Else, if the word ends in (consonant) + o or y, or s, sh, ch, # or x, we change y to i and add es. Finally, in all other cases, # just add s. So buy -> buys, boy-> boys, but try -> tries, lady -> ladies. # Similarly, go -> goes but goo -> goos. For words like volcano -> volcanos # you have to put the forms in manually (or change the rule here, and put # forms in -o + es in manually, e.g. does, goes, tomatoes, potatoes). # ifmatch('^.*[aeiou][oy]$', word, word . s, ifmatch('^.*([sxoy]|sh|ch)$', word, regsub('^(.*)y$', '\1i', word) . es, word . s)) } def noun(sing, class) basic-noun(sing, pluralize(sing), class) noun(book, thing) noun(DVD, thing) noun(glass, thing) noun(church, thing) noun(flower, thing) noun(bath, thing) noun(teacher, person) noun(lady, person) # Pluralized (correctly) to 'ladies' noun(boy, person) # Pluralized (correctly) to 'boys' # An irregular noun. basic-noun(policeman, policemen, person) # ################## Verbs ################# # # The "props" parameter specifies families or attributes. def basic-verb(stem, props, 3sing, pasttense) { word stem:props { *: pres non-3rd sg; 3sing: pres 3rd sg; *: pres pl; pasttense: past; } } def verb(stem, props, pasttense) \ basic-verb(stem, props, pluralize(stem), pasttense) verb(buy, TransV DitransBenV, bought) verb(rent, TransV DitransBenV, rented) verb(go, IntransV, went) verb(sleep, IntransV, slept) # Here we show how you can specify a predicate or other attribute. # Admittedly this is not too useful here, but it can be much more so in # the case of a foreign language, where we want the semantic predicates # to be in English. (See arabic.ccg.) verb(eat, TransV IntransV (pred=manjar), ate) ############################################################# # # # RULES # # # ############################################################# # This declaration specifies the contents of rules.xml. Each statement # specifies a single rule; it is also possible for statements to cancel # some or all rules. # # Note that some rules are enabled by default; this includes application, # composition and crossed composition (forward and backward in each case), # as well as forward type-raising from np to s/(s\np) and backward # type-raising from np to s$1\(s$1/np). rule { # turn off forward cross-composition no xcomp +; # this is how we could turn off all type-raising rules. # no typeraise; # Declare a backward type-raising rule from pp to s$1\(s$1/pp). # The $ causes a dollar-sign raise category to be created, as shown; # without it, we'd just get s\(s/pp). typeraise - $: pp => s; # Declare a type-changing rule to enable pro-drop (not useful in English!) 
# typechange: s[finite]\np[nom]$1 => s[finite]$1 ; } # This shows how you can turn off all defaults and specify your own # properties from scratch, if you want. # rule { # no; # remove all defaults # app +-; # comp +-; # +- means both forward and backward # xcomp -; # sub +-; # xsub +-; # # Defaults for typeraising are np => s, if omitted. # typeraise +; # typeraise - $; # } # ############################################################# # # # CATEGORIES # # # ############################################################# # Specify lexical families and the lexical insertion rules for each # family. Properties of the family can be given in parens after the # family name. The family name should either be the same as a part # of speech, or the part of speech should be given in parens after # the family name. # Categories can be specified in an expected form, e.g. s\np[nom]/np[acc]. # The notation np<3>[acc] corresponds to XML code like this: # # # # # # i.e. the <3> specifies the feature-structure ID, and the [acc] # specifies a constraint. In this case, a constraint of the form # [CASE=acc] is generated because of the feature {} declaration above. # If an unknown value is given, e.g. [foo], it's assumed to be a feature, # rather than a feature value, and you get code like # # # You can also write [foo=bar] to explicitly give a feature and value. # And an entry like [X] corresponds to # # Note also that slashes can be followed by a slash mode, e.g. /<, or # the mode can be omitted; in this case, a default mode is generated: # \<, />, |. family Det(indexRel=det) { entry: np<2>[X PERS=3rd] /^ n<2>[X]: X:sem-obj(*); } family Prep-Nom(Prep, indexRel="*NoSem*") { # You can name your entries, as shown, although it's not clear there's # much point. # # The pp<~3> notation generates an 'inheritsFrom' tag rather than an 'id' # tag for the feature structure. This unifies only the properties not # explicitly given in the category, i.e. everything but 'lex' will unify. # # The entry [lex=*] corresponds to # and means that a feature 'lex' will be attached, whose value is the # word stem. entry Nominal: pp<~3>[lex=*] /< np<3>[acc]; # If members are specified, the family defaults to 'closed'. member: for; } family Conj { entry: np[NUM, X0] \* np[X1] / np[X2]: X0(and ^ (L1 ^ elem ^ X1 ^ (L2 ^ elem ^ X2))); } family DollarTest { entry: s\np$1\*(s\np); entry: s\(np$1)\*(s\np); } family N { entry: n<2>[X NUM]: X:sem-obj(*); } family Pro { entry: np<2>[X NUM PERS CASE]: X:sem-obj(*); } # Here we create a macro to describe the category for a verb, with transitive # arguments ARGS (possibly empty) and corresponding semantics SEM. # Don't call this macro just "verb" since that's used above already! def verbcat(args, sem) { # A * here corresponds to . # Similar use of * appears above in [lex=*] in prepositions, # and * in determiners. s<1>[E] \ np<2>[X NUM PERS nom] args: E:action(* X:animate-being sem) } family IntransV(V) { entry: verbcat(,); } # This shows how we could extend verbcat() to handle transitive verbs. # Since the arguments for ditransitive verbs could potentially either # before or after the transitive argument, we need two different macros. # Or, we could create one macro, with two different parameters for "before" # and "after" arguments. def before_transverbcat(args, sem) { verbcat(args / np<3>[Y acc], Y:sem-obj sem) } def after_transverbcat(args, sem) { verbcat(/ np<3>[Y acc] args, Y:sem-obj sem) } family TransV(V) { entry: after_transverbcat(,); } family DitransBenV(V) { # Careful here! 
Remember that the arguments in a CCG category will be # listed in backwards order compared to how they appear in the surface # syntax. Hence SUBJ VERB X Y Z corresponds to s\np/z/y/x. entry DTV: after_transverbcat(/< np[Z acc], Z:animate-being); entry NP-PPfor: before_transverbcat(/ pp[Z lex=for], Z:animate-being); # This shows how we could define the previous entry directly in # terms of verbcat(). #entry NP-PPfor: verbcat(/ pp<4>[Z lex=for] /< np<3>[Y acc], # Y:sem-obj Z:animate-being); } ############################################################# # # # TESTBED # # # ############################################################# # Statements to put in testbed.xml. If you omit the number, it will omit # the corresponding numOfParses item in the XML; I think this currently # is equivalent to specifying 1 as the number. If you put a ! before a # line, this indicates a "known failure" (known="true" in the XML). testbed { the teacher buys the policeman a book: 1; the teacher buys the policemen some flowers: 1; the teachers buy a book: 3; she buys it: 3; she buy it: 0; # Possible example of a known failure, in case we know we don't correctly # reject "she buy buy": ! she buy buy: 0; they buys it: 0; she buys the flower for him: 1; she buys the flower for he: 0; her buys the flower for him: 0; he rented her a DVD: 1; he rented a DVD for her: 1; he rented a DVD her: 0; } ================================================ FILE: ccg-format-grammars/tinytiny/tinytiny.ccg ================================================ # A truly minimal grammar for CCG. # Ben Wing, May 2006 ################## Features ################# feature { CASE<2>: nom acc; NUM<2>: sg pl; PERS<2>: non-3rd {1st 2nd} 3rd; TENSE: past pres; SEM-NUM: sg-X pl-X; # Some alternate code that appeared from somewhere, I'm not sure anymore. # Enable the following three statements and disable the statement above # beginning `NUM<2>: ...'. It looks like it tries to implement something to # do with number agreement. (Note that number agreement is already taken care # of in the normal system. I'm not sure what the code is trying to do.) # num<2,X:num>: sg pl; # num<1,2>: sg-agr:sg pl-agr:pl; # num<2>: sg-2:sg pl-2:pl; ontology: sem-obj { phys-obj { animate-being { person } thing } situation { change { action } state } }; } ################## Words ################# # Example of how to have punctuation and other non-word characters in a # lexical item. word '.':Punc; word ',':Punc; word '?':Punc; word the:Det; word a:Det: sg; word pro1:Pro(animate-being) { I: 1st sg nom sg-X; me: 1st sg acc sg-X; we: 1st pl nom pl-X; us: 1st pl acc pl-X; } def noun(sing, plur, class) { word sing:N(class) { *: sg sg-X; plur: pl pl-X; } } noun(book, books, thing) noun(peach, peaches, thing) noun(boy, boys, person) noun(policeman, policemen, person) def verb(stem, props, 3sing, pasttense) { word stem:props { *: pres non-3rd sg; 3sing: pres 3rd sg; *: pres pl; pasttense: past; } } verb(go, IntransV, goes, went) verb(sleep, IntransV, sleeps, slept) verb(eat, TransV IntransV, eats, ate) verb(see, TransV, sees, saw) # This is a test of set arguments. Not clear it's useful or should be here; # maybe move to tiny.ccg? 
verb(setverb, SetargV, setverbs, setverbed) ################## Categories ################# family Punc { entry: punc; } family Det(indexRel=det) { entry: np<2>[X PERS=3rd]/^ n<2>[X]: X:sem-obj(*); } family N { entry: n<2>[X]: X:sem-obj(*); } family Pro { entry: np<2>[X]: X:sem-obj(*); } family IntransV(V) { entry: s<1>[E] \ np<2>[X nom]: E:action(* X:animate-being); } family TransV(V) { entry: s<1>[E] \ np<2>[X nom] / np<3>[Y acc]: E:action(* X:animate-being Y:sem-obj); } family SetargV(V) { entry: s<1>[E] {\np<2>[X nom], / np<3>[Y acc]}: E:action(* X:animate-being Y:sem-obj); } ################## Test sentences ################# testbed { the policemen eat: 2; the boys eat: 2; the boys eat the peaches: 1; the policeman sleeps: 1; the policemen sleeps: 0; the policemen sleep: 1; the policeman sleeps the peach: 0; the policeman saw me: 1; the policeman saw I: 0; I see the book: 1; I sees the book: 0; I see a book: 1; I see a books: 0; } ================================================ FILE: ccgbank/bin/american-to-logical-quotes.py ================================================ """ Copryright (c) 2011 Dennis N. Mehay Assumes tokenized, PTB3-normalized UTF-8 text, one sentence per line. => Turns 'American'-style quotations into 'British'/'logical'-style quotations. So, e.g., `` Hello , '' said John . becomes: `` Hello '' , said John . [Insert LGPL here] """ import sys, codecs, os streamReader = codecs.lookup("utf-8")[2] streamWriter = codecs.lookup("utf-8")[-1] sys.stdin = streamReader(sys.stdin) sys.stdout = streamWriter(sys.stdout) for ln in sys.stdin: # trim off extra whitespace and replace double spaces with single spaces. ln = ln.strip().replace(u" ", u" ") # now replace # , '' # with # '' # and # . '' # with # '' . ln = ln.replace(u" , ''", " '' ,").replace(u" . ''", " '' .") # now fix any double-punct messes this might have created. ln = ln.replace(u" '' . ?", u" . '' ?").replace(u" '' . !", u" . '' !") sys.stdout.write(ln + '\n') ================================================ FILE: ccgbank/bin/convert-mtc-systems.py ================================================ """ This program takes a set of documents (all streamed from stdin at once) and formats them in a way suitable for use with the NIST-distributed mteval script. The output is in UTF-8. Usage: cat [MTC_DIR_FOR_SYSTEM] | python convert-mtc.systems.py [doctype-string {'source', 'target', 'ref'} (default='target')] | [NEW_XML_DOC_TO_STDOUT] """ import sys, os, re, codecs, xml.sax.saxutils, my_unicode try: import chardet except: chardet = None from xml.etree.ElementTree import * from collections import defaultdict def tokenize(t): """very simple text tokenization: n't => n't 's => 's ' => ' where '' is not whitespace. 
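    e.g., reading off the replace calls below (assuming plain ASCII
    apostrophes): "John's dog doesn't bark ." becomes
    "John 's dog does n't bark ."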
""" t = t.replace("n't", " n't").replace("'s", " 's").replace("' ", " ' ") if t[-1] == "'": t = t[:-1] + " " + t[-1] return t.replace(" ", " ") def decode_line(ln, encoding): res = None try: res = ln.decode(encoding) except: try: res = ln.decode("iso-8859-2") except: try: res = ln.decode("iso-8859-1") except: try: res = ln.decode("utf-8") except: try: res = ln.decode("GB2312") except: try: res = ln.decode("Big5") except: try: res = ln.decode("EUC-TW") except: res = ln return res doc_pattern = re.compile(u"<[Dd][Oo][Cc] docid=\"(.*)\" sysid=\"(.*)\">(.*)") doc_pattern_source = re.compile(u"<[Dd][Oo][Cc] docid=\"(.*)\">(.*)") seg_pattern = re.compile(u"(.*)$") doc_type = "target" if len(sys.argv) >= 2: doc_type = sys.argv[1].lower() if not doc_type in ["target", "source", "reference"]: doc_type = "target" mtc_in = sys.stdin.readlines() mtc_all = (os.linesep).join(mtc_in) if not chardet is None: encoding = chardet.detect(mtc_all)['encoding'] else: encoding = "ISO-8859-2" # turn stdout into a UTF-8 converting writer. streamWriter = codecs.lookup("UTF-8")[-1] sys.stdout = streamWriter(sys.stdout) output = sys.stdout # map from auto-assigned ID to MTC ID. autoid2mtcid = {} mtc = defaultdict(lambda: []) sys = None for l in mtc_in: l = decode_line(l, encoding).strip() if l.startswith("" + \ os.linesep + "" + os.linesep +\ "" + os.linesep) if doc_type == "target": output.write(" " % sys + os.linesep) elif doc_type == "source": output.write(" " + os.linesep) else: output.write(" " + os.linesep) docs = mtc.keys() docs.sort() for (sy,doc) in docs: output.write(" " % doc + os.linesep) segids_and_texts = mtc[(sy,doc)] segids_and_texts.sort(lambda a,b: cmp(int(a[0]),int(b[0]))) for (segid,text) in segids_and_texts: output.write(" %s " % (segid,xml.sax.saxutils.escape(my_unicode.removeInvalidChars(tokenize(text)))) + os.linesep) output.write(" " + os.linesep) if doc_type == "target": output.write(" " + os.linesep + "") elif doc_type == "source": output.write(" " + os.linesep + "") else: output.write(" " + os.linesep + "") ================================================ FILE: ccgbank/bin/convert-spaces-to-newlines.py ================================================ # # converts spaces to newlines, and newlines to special chars, # from stdin to stdout # import sys, re; [sys.stdout.write(re.sub(' ','\n',re.sub('\n','',line))) for line in sys.stdin] ================================================ FILE: ccgbank/bin/convert_all ================================================ #!/bin/bash for i in 00 01 02 03 04 05 06 07 08 09 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 do echo "Starting conversion for section $i" nice ccg-build -Dsect=$i -Dfile=* convert-puncts-aux-bbn >& logs/log.convert.$i & done ================================================ FILE: ccgbank/bin/correlate-to-judgments.py ================================================ """ Correlate human judgments (streamed into sys.stdin -- e.g., from the MTC) to the BLEU/NIST scores in the given directories (sys.argv[1] and sys.argv[2]). Depends on rpy2 having been installed. """ import sys, os try: import rpy2 import rpy2.robjects as robjs except ImportError: print >> sys.stderr, "please install rpy2. exiting..." sys.exit(-1) def num2string(n): """ E.g., 0 => '00', 1 => '01' and 10 => '10'. """ try: numm = int(n) except: numm = n if numm < 10: return str(numm) else: return str(numm) human_judgments = [] human_judgments_fluency = [] # fluency. human_judgments_acc = [] # accuracy. human_judgments_ave = [] # average of both. 
for l in sys.stdin: l = l.strip() if l.startswith("#"): continue lparts = l.split(",") # appending (sys,doc,judge,ref_sys,segment,fluency,accuracy) human_judgments.append(tuple(lparts[0:7])) human_judgments_fluency.append(int(lparts[5])) human_judgments_acc.append(int(lparts[6])) human_judgments_ave.append((float(lparts[5]) + float(lparts[6]))/2.0) human_judgments_fluency = robjs.FloatVector([float(i) for i in human_judgments_fluency]) human_judgments_acc = robjs.FloatVector([float(i) for i in human_judgments_acc]) human_judgments_ave = robjs.FloatVector([float(i) for i in human_judgments_ave]) bleu_nist_dir1 = sys.argv[1] bleu_nist_dir2 = sys.argv[2] # the next two are maps from: (sys,doc,ref,segID) => score bleu_scores = {} nist_scores = {} for f in [fl for fl in os.listdir(bleu_nist_dir1) if ("BLEU" in fl or "NIST" in fl)]: for l in open(bleu_nist_dir1 + os.sep + f, "rb").readlines(): if l.strip() == "": continue (sys,ref_sys,doc,seg,bleu_or_nist_score) = l.split(",") if "BLEU" in f: bleu_scores[(sys,doc,ref_sys,"S"+num2string(seg))] = bleu_or_nist_score else: nist_scores[(sys,doc,ref_sys,"S"+num2string(seg))] = bleu_or_nist_score for f in [fl for fl in os.listdir(bleu_nist_dir2) if ("BLEU" in fl or "NIST" in fl)]: for l in open(bleu_nist_dir2 + os.sep + f, "rb").readlines(): if l.strip() == "": continue (sys,ref_sys,doc,seg,bleu_or_nist_score) = l.split(",") if "BLEU" in f: bleu_scores[(sys,doc,ref_sys,"S"+num2string(seg))] = float(bleu_or_nist_score) else: nist_scores[(sys,doc,ref_sys,"S"+num2string(seg))] = float(bleu_or_nist_score) # for both BLEU and NIST, compute rpy2 vectors that parallel the seqeuence # of human judgments. # step through the (sys,doc,judge,ref_sys,segment,fluency,accuracy) tuples. bleu_lst = [] nist_lst = [] for (s,d,j,rs,sg,f,a) in human_judgments: if (s,d,rs,sg) in bleu_scores: bleu_lst.append(bleu_scores.get((s,d,rs,sg))) else: print "nope", (s,d,rs,sg) if (s,d,rs,sg) in nist_scores: nist_lst.append(nist_scores.get((s,d,rs,sg))) else: print "nope", (s,d,rs,sg) bleu_vec = robjs.FloatVector(bleu_lst) nist_vec = robjs.FloatVector(nist_lst) # compute correlations b_fluency = robjs.r['cor'](bleu_vec, human_judgments_fluency) b_accuracy = robjs.r['cor'](bleu_vec, human_judgments_acc) b_average = robjs.r['cor'](bleu_vec, human_judgments_ave) print "BLEU's Pearson correlation wrt fluency:", b_fluency print "BLEU's Pearson correlation wrt accuracy:", b_accuracy print "BLEU's Pearson correlation wrt the average of fluency and accuracy", b_average nist_fluency = robjs.r['cor'](nist_vec, human_judgments_fluency) nist_accuracy = robjs.r['cor'](nist_vec, human_judgments_acc) nist_average = robjs.r['cor'](nist_vec, human_judgments_ave) print "NIST's Pearson correlation wrt fluency:", nist_fluency print "NIST's Pearson correlation wrt accuracy:", nist_accuracy print "NIST's Pearson correlation wrt the average of fluency and accuracy", nist_average ================================================ FILE: ccgbank/bin/filter_feats.py ================================================ #!/usr/bin/env python """ (c) 2008 Dennis N. Mehay Use this file any way you want, just please give the author credit if it makes it into any research in any meaningful way. I make no claims whatsoever about the fitness or merchantability of this code. Use at your own risk. 
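As read off the parsing code below, each input line is one instance: either
boolean features, "TAG feat1 feat2 ...", or real-valued features,
"TAG feat1:val1 feat2:val2 ...". Instances whose TAG occurs fewer than -n
times are dropped, and features occurring fewer than -f times are dropped.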
""" import sys, math from optparse import OptionParser as OP pr = OP() pr.add_option("-i","--input",type="string",help="input source [default=].",\ default=sys.stdin) pr.add_option("-o","--output",type="string",help="output location [default=].",\ default=sys.stdout) pr.add_option("-n","--number",type="int",\ help="number of times a category must have been seen to retain [default=5]",\ default=5) pr.add_option("-f","--feat_freq",type="int",help="feature frequency cutoff\n"+\ "(how frequent must a feature be to retain it? [default=1])",default=1) (opts,args) = pr.parse_args(sys.argv) inf = opts.input if not inf is sys.stdin: inf = open(inf,'r') outf = opts.output if not outf is sys.stdout: outf = open(outf,'w') try: tag_cnt = {} ft_cnt = {} lines = {} ln_cnt = -1 for l in inf: l = l.strip() ln_cnt += 1 lines[ln_cnt] = l l = l.split() tag = l[0] tag_cnt[tag] = tag_cnt.get(tag,0) + 1 feats = l[1:] if ':' in feats[0] and not(feats[-1]==':'): # real-valued features feats = map(lambda a: (a[0:a.rfind(':')],a[a.rfind(':')+1:]), l[1:]) for (f,act) in feats: ft_cnt[f] = ft_cnt.get(f,0) + 1 #math.fabs(float(act)) else: # boolean for f in feats: ft_cnt[f] = ft_cnt.get(f,0) + 1 for i in range(ln_cnt + 1): l = lines.get(i) l = l.strip().split() tag = l[0] feats = l[1:] if tag_cnt.get(tag) >= opts.number: tag_printed = False if ':' in feats[0] and not(feats[-1]==':'): # real-valued features feats = map(lambda a: (a[0:a.rfind(':')],a[a.rfind(':')+1:]), l[1:]) for (f,act) in feats: if ft_cnt.get(f) >= opts.feat_freq: if not tag_printed: print >> outf, tag, tag_printed = True print >> outf, f+':'+act, else: # boolean for f in feats: if not tag_printed: print >> outf, tag, tag_printed = True print >> outf, f, print >> outf, '' if i%100==0: outf.flush() finally: outf.flush() if not inf is sys.stdin: inf.close() if not outf is sys.stdout: outf.close() ================================================ FILE: ccgbank/bin/find-betas-no-gold.py ================================================ """ Given: (1) a file supertagged words (OpenCCC file output format as produced by, e.g., WordAndPOSDictionaryLabellingStrategy), (2) a list (as a string) of tagging ambiguity levels (e.g., "1.4 1.6 1.8...") that represent the desired tag/word levels (rounded off at the hundredths place to <=1.41, <=1.61, etc.), (3) possibly tagging dictionaries (if needed), and (4) the corresponding 'K' parameters (e.g., "20 150" as in Clark and Curran (2007)), produce the list of betas that would produce those ambiguity levels. """ import optparse import sys import decimal import math """ A little on-the-fly class creation for iterating through multi-stag format files. """ class STIterator: def __init__(self, f): self.f = f def next(self): l = self.f.readline() while l.strip()=='' and l: l = self.f.readline() if l: lines = [] # not at eof. if l.strip() != "": print >> sys.stderr, "line=", l.strip(), "ill-formed st output file." raise Exception else: l = self.f.readline() while l.strip() != "" and l: lines.append(l.strip()) l = self.f.readline() if lines == []: print >> sys.stderr, "line=", l.strip(), "ill-formed st output file." raise Exception else: res = [] for ln in lines: # each line is: word POS1 ... POSN ST1 ... STM # we just want the word, first pos and supertags. 
parts = ln.split() wd = parts[0] pos = parts[2] how_many_poss = int(parts[1]) stgs = zip(parts[2+(how_many_poss*2)+1::2],map(lambda n: float(n), parts[2+(how_many_poss*2)+2::2])) res.append((wd,pos,stgs)) return res else: raise StopIteration def __iter__(self): return self p = optparse.OptionParser() p.add_option("-i", "--inputf", type="string", help="input source [default=]", default=sys.stdin) p.add_option("-o", "--outputf", type="string", help="output destination [default=]", default=sys.stdout) p.add_option("-a", "--ambiguities", type="string", help="a space delimited string of tagging ambiguity levels [default=\"1.2 1.4 1.6 1.8 2.0 2.5 3.0 3.5\"]", default="1.2 1.4 1.6 1.8 2.0 2.5 3.0 3.5") p.add_option("-K", "--Ks", type="string", help="a space delimited string of K values (only two) [default=\"20 150\", optional]", \ default="20 150") p.add_option("-w", "--wordkeyeddict", type="string", help="word-keyed tagging dict [no default, optional]",\ default=None) p.add_option("-p", "--poskeyeddict", type="string", help="POS-keyed tagging dict [no default, optional]",\ default=None) (ops,args) = p.parse_args() try: # POS-keyed dict must be there if word-keyed one is. assert (not (not (ops.wordkeyeddict is None) and (ops.poskeyeddict is None))) except: print >> sys.stderr, "need POS-keyed dict if using word-keyed dict." sys.exit(-1) inf = ops.inputf if not inf is sys.stdin: inf = open(inf, 'r') outf = ops.outputf if not outf is sys.stdout: outf = open(outf, 'w') input_sents = [s for s in STIterator(inf)] wdict = {} if not ops.wordkeyeddict is None: entries = map(lambda l: l.split(), open(ops.wordkeyeddict, 'r').readlines()) wdict[entries[0]] = (int(entries[1]), set(entries[2:])) pdict = {} if not ops.poskeyeddict is None: entries = map(lambda l: l.split(), open(ops.poskeyeddict, 'r').readlines()) posdict[entries[0]] = set(entries[1:]) try: ambs = map(lambda a: float(a), ops.ambiguities.split()) betas = [] current_beta = 1.0 last_beta_above = None last_beta_below = 0.0 total_tags = 0.0 total_words = 0.0 total_right = 0.0 ks = map(lambda kay: int(kay), ops.Ks.split()) for a in ambs: current_beta = 1.0 last_beta_above = None last_beta_below = 0.0 k = ks[0] if a!=ambs[-1] else ks[1] found = False while not found: total_tags = 0.0 total_words = 0.0 total_right = 0.0 for insent in input_sents: for lex in insent: total_words += 1 w = lex[0] pos = lex[1] stags = lex[2] if len(wdict)>0: # filter with appropriate dictionary. (freq,tags) = wdict.get(w,(0,set([]))) if freq >= k: tags = tags else: tags = pdict.get(pos,set([])) if len(tags)>0: stags = filter(lambda st: st[0] in tags, stags) best = stags[0][1] # how many tags are there that made the beta cut-off? total_tags += len(filter(lambda st: st[1] >= (current_beta * best), stags)) # round to the nearest hundredth tags_per_word = (float(total_tags)/total_words) decimal.getcontext().prec = 4 as_string = str(decimal.Decimal(str(tags_per_word))) # we're looking for 1.40..., or 1.60..., etc. (as the case may be) found = tags_per_word == a or ((as_string[:3]==str(a)[:3]) and (as_string[3]=='0')) if found: betas.append(current_beta) current_beta = 1.0 last_beta = None else: # decide which direction to loosen the beta. if tags_per_word > a: # get more restrictive (i.e., larger beta). 
if last_beta_above is None: print >> sys.stderr, "error" sys.exit(-1) else: tempbeta = current_beta current_beta += math.fabs(last_beta_above - current_beta)/2.0 last_beta_below = tempbeta else: # get less restrictive (i.e., smaller beta) tempbeta = current_beta current_beta -= math.fabs(current_beta - last_beta_below)/2.0 last_beta_above = tempbeta print >> outf, "betas", ' '.join(map(lambda b: str(b), betas)) except: print "Unexpected error:", sys.exc_info()[0] raise finally: # clean up, clean up... if not inf is sys.stdin: inf.close() if not outf is sys.stdout: outf.close() ================================================ FILE: ccgbank/bin/gen_parser_events_a ================================================ #!/bin/bash for i in 02 03 04 05 do ccg-build -Dsect=$i -f build-ps.xml gen-parser-events &> logs/log.gen.parser.events.$i done ================================================ FILE: ccgbank/bin/gen_parser_events_b ================================================ #!/bin/bash for i in 06 07 08 09 do ccg-build -Dsect=$i -f build-ps.xml gen-parser-events &> logs/log.gen.parser.events.$i done ================================================ FILE: ccgbank/bin/gen_parser_events_c ================================================ #!/bin/bash for i in 10 11 12 13 do ccg-build -Dsect=$i -f build-ps.xml gen-parser-events &> logs/log.gen.parser.events.$i done ================================================ FILE: ccgbank/bin/gen_parser_events_d ================================================ #!/bin/bash for i in 14 15 16 17 do ccg-build -Dsect=$i -f build-ps.xml gen-parser-events &> logs/log.gen.parser.events.$i done ================================================ FILE: ccgbank/bin/gen_parser_events_e ================================================ #!/bin/bash for i in 18 19 20 21 do ccg-build -Dsect=$i -f build-ps.xml gen-parser-events &> logs/log.gen.parser.events.$i done ================================================ FILE: ccgbank/bin/gen_realizer_events_a ================================================ #!/bin/bash for i in 02 03 04 05 do ccg-build -Dsect=$i -f build-rz.xml gen-realizer-events &> logs/log.gen.realizer.events.$i done ================================================ FILE: ccgbank/bin/gen_realizer_events_b ================================================ #!/bin/bash for i in 06 07 08 09 do ccg-build -Dsect=$i -f build-rz.xml gen-realizer-events &> logs/log.gen.realizer.events.$i done ================================================ FILE: ccgbank/bin/gen_realizer_events_c ================================================ #!/bin/bash for i in 10 11 12 13 do ccg-build -Dsect=$i -f build-rz.xml gen-realizer-events &> logs/log.gen.realizer.events.$i done ================================================ FILE: ccgbank/bin/gen_realizer_events_d ================================================ #!/bin/bash for i in 14 15 16 17 do ccg-build -Dsect=$i -f build-rz.xml gen-realizer-events &> logs/log.gen.realizer.events.$i done ================================================ FILE: ccgbank/bin/gen_realizer_events_e ================================================ #!/bin/bash for i in 18 19 20 21 do ccg-build -Dsect=$i -f build-rz.xml gen-realizer-events &> logs/log.gen.realizer.events.$i done ================================================ FILE: ccgbank/bin/get-text-from-mtc-style.py ================================================ """ Gets the text from a MTC-style corpus. Just looks for ' ' segments. 
=> (c) 2011 Dennis Nolan Mehay [Insert LGPL here] """ import re, sys, codecs, os pattern = re.compile(u"\\s*(.*)\\s*") input = sys.stdin.read() try: import chardet encoding = chardet.detect(input)['encoding'] except: # this is what the original MTC corpus is encoded in. encoding = "iso-8859-2" input = input.decode(encoding) streamWriter = codecs.lookup(encoding)[-1] sys.stdout = streamWriter(sys.stdout) for seg in pattern.findall(input): sys.stdout.write(seg.strip() + os.linesep) ================================================ FILE: ccgbank/bin/get-truecase-list.py ================================================ """ Requires Python >= 2.6x+ but < 3.0. Takes in a stream (from stdin) or file of *tokenized* plain text (utf-8), returns a list of words that occurred more than twice and were in upper-case more frequently than not. """ import optparse, sys, codecs, os from collections import defaultdict def isAllUpper(st): return ( st.upper() == st and st.lower() != st ) op = optparse.OptionParser() op.add_option("-i", "--input", type="string", help="input file or stream (default = )", default=sys.stdin) op.add_option("-o", "--output", type="string", help="output file or stream (default = )", default=sys.stdout) op.add_option("-f", "--use_first", action="store_true", help="whether to use the first word of each "+\ "sentence for counting uppercase vs. lowercase (default = False)", default=False) (ops, args) = op.parse_args() inf = ops.input if not inf is sys.stdin: inf = open(inf, "rb") use_first_word = ops.use_first outf = ops.output if not outf is sys.stdout: outf = codecs.open(outf, "wb", "utf-8") else: # make stdout code utf-8 streamWriter = codecs.lookup("UTF-8")[-1] outf = streamWriter(outf) # map from: lowercased_word_key => specific_cased_form => count wds2ulcounts = defaultdict(lambda: defaultdict(lambda: 0)) try: l = inf.readline() while l: l = l.strip().decode("utf-8") if l == u"": continue words = l.split() if not use_first_word: words = words[1:] for w in words: key = w.lower() wds2ulcounts[key][w] += 1 l = inf.readline() for (wdkey,frms) in wds2ulcounts.items(): wdforms = frms.items() # sum all counts. if more than 2, then write out the most frequent, else don't. sum_all = sum([cnt for (wf,cnt) in wdforms]) # if there is only one form, seen more than once and it is a cased form, print it (this last will avoid printing punctuation and # always-lowercase words like 'the'). if len(wdforms) == 1: most_freq = wdforms[0] if sum_all > 2 and most_freq[0].lower() != most_freq[0]: #outf.write("wd %s only has one form, seen %d times" % (wdforms[0][0], wdforms[0][1]) + os.linesep) outf.write(most_freq[0] + os.linesep) else: continue else: if sum_all == 2: #outf.write("wd %s only occurred twice. cannot decide which is most frequent." % (wdkey) + os.linesep) continue else: wdforms.sort(lambda a,b: -cmp(a[1],b[1])) most_freq = wdforms[0] second_most_freq = wdforms[1] # see whether there is a tie. if so, no dice. if most_freq[1] == second_most_freq[1]: #outf.write("wd %s occurred more than twice, but there was a tie btw forms %s and %s (perhaps others)." % \ # (wdkey, wdforms[0][0], wdforms[1][0]) + os.linesep) continue else: # only mention it if the most freq form is uppercased somewhere. if most_freq[0][0].lower() != most_freq[0][0]: #outf.write("wd %s occurred most with form %s." 
% (wdkey, wdforms[0][0]) + os.linesep) outf.write(most_freq[0] + os.linesep) finally: try: outf.close() except: pass try: inf.close() except: pass ================================================ FILE: ccgbank/bin/get-uniq-nbest.py ================================================ from BeautifulSoup import BeautifulStoneSoup as BSS import codecs import sys, os streamWriter = codecs.lookup('utf-8')[-1] sys.stdout = streamWriter(sys.stdout) inf = open(sys.argv[1], "rb").read() try: beta = float(sys.argv[2]) except: beta = 0.1 soup = BSS(inf) segs = soup.findAll(lambda t: t.name == u'seg') tot_paraphrases = 0.0 tot_segs = 0.0 for seg in segs: tot_segs += 1 if seg.get('complete') == 'true': best = seg.find(lambda p: p.name == 'best') ref = seg.ref.find(text=True) eye_dee = seg.get(u'id') paraphrases = set([p.find(text=True) for p in seg.findAll(lambda e: e.name in [u'best', u'next'])]) tot_paraphrases += len(paraphrases) sys.stdout.write(ref + u' ||| ' + u' <-> '.join(paraphrases)) sys.stdout.write(os.linesep) print "ave paraphrases/seg", tot_paraphrases/tot_segs ================================================ FILE: ccgbank/bin/get_factors_from_parse.py ================================================ #!/usr/bin/env python """ (c) 2008 Dennis N. Mehay Use this file any way you want, just please give the author credit if it makes it into any research in any meaningful way. I make no claims whatsoever about the fitness or merchantability of this code. Use at your own risk. Take a file of CCGbank-style parses and get the words, POSs and lexical cat's from them. We also insert the word as the 'lemma', just as a placeholder. So we have the following output form (for each parse in the input file): ||| ... ||| Print out parse IDs (if there) as they are. """ import sys, re import optparse p = optparse.OptionParser() p.add_option("-i", "--inputf", type="string", \ help="Input file to be postprocessed (one parse per line with IDs preceding them) [defaults to stdin]",\ default=None) p.add_option("-o", "--outputf", type="string", \ help="The output location [defaults to stdout]",\ default=None) (opts, args) = p.parse_args(sys.argv) inf = None outf = None if opts.inputf is None: inf = sys.stdin else: inf = open(opts.inputf,'r') if opts.outputf is None: outf = sys.stdout else: outf = open(opts.outputf,'w') try: global lexNodePattern lexNodePattern = re.compile(r'()+?') """ A procedure that returns a list of all lexical nodes in a CCGbank-style parse tree (in string representation). """ def getLexicalNodes(tree): matches = re.findall(lexNodePattern, tree) return matches for l in inf: if "ID=" in l: print >> outf, l.strip() elif l.strip()!='': nodes = getLexicalNodes(l.strip()) ans = '' for n in nodes: parts = n.split() (w,pos,st) = (parts[4],parts[2],parts[1]) ans += w+'|'+w+'|'+pos+'|'+st+ ' ' print >> outf, ans.strip() finally: if not opts.inputf is None: inf.close() if not opts.outputf is None: outf.close() ================================================ FILE: ccgbank/bin/get_just_words_from_ner_text.py ================================================ """ Takes NE tagged text from stdin (assuming utf-8) and does just what it says: prints to stdout only the words. 
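For example (hypothetical input/output), a line such as

    George_Bush_PERSON visited Crawford_LOCATION yesterday .

would be printed as

    George_Bush visited Crawford yesterday .

(only the trailing _LABEL is dropped; multi-word NE tokens stay fused).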
""" import codecs, sys, os from optparse import OptionParser as OP pr = OP() pr.add_option("-o","--output",type="string",help="output location [default=].",\ default=sys.stdout) (opts,args) = pr.parse_args(sys.argv) outf = opts.output if not outf is sys.stdout: outf = open(outf,'w') streamWriter = codecs.lookup("utf-8")[-1] outw = streamWriter(outf) for l in sys.stdin: l = l.decode("utf-8") parts = l.split() snt = [] for p in parts: if u"_" in p: subparts = p.split(u"_") if len(subparts) > 1: w = u"_".join(subparts[:-1]) else: w = p snt.append(w) else: snt.append(p) outw.write(u" ".join(snt) + '\n') outf.flush() if not outf is sys.stdout: outf.close() ================================================ FILE: ccgbank/bin/lowercase_tagged_text.py ================================================ #!/usr/bin/env python """ Takes a POS-tagged file and writes out the text with tokens lowercased except for proper nouns. A file with the list of word-tag pairs can also be written out. (c) 2010 Michael White [insert LGPL here] """ import sys from optparse import OptionParser as OP pr = OP() pr.add_option("-i","--input",type="string",help="input source [default=]",\ default=sys.stdin) pr.add_option("-o","--output",type="string",help="output location [default=]",\ default=sys.stdout) pr.add_option("-p","--pairs",type="string",help="output file for word-tag pairs",\ default=None) (opts,args) = pr.parse_args(sys.argv) inf = opts.input if not inf is sys.stdin: inf = open(inf,'r') outf = opts.output if not outf is sys.stdout: outf = open(outf,'w') pairsf = opts.pairs if not pairsf is None: pairsf = open(pairsf,'w') try: sent = [] pairs = [] for l in inf: l = l.strip() l = l.split() if l[0] == '': sent = [] pairs = [] elif l[0] == '': print >> outf, ' '.join(sent) if not pairsf is None: for (token,tag) in pairs: print >> pairsf, token, tag else: token,tag = l[0],l[1] if tag[:3] != 'NNP' and (len(token) <= 1 or not token[1].isupper()): token = token.lower() sent.append(token) pairs.append((token,tag)) if len(l) >= 4: tag2 = l[3] pairs.append((token,tag2)) finally: if not inf is sys.stdin: inf.close() if not outf is sys.stdout: outf.close() if not pairsf is None: pairsf.close() ================================================ FILE: ccgbank/bin/merge-mtc-ids.py ================================================ """ This program re-inserts the MTC unique IDs (sys+DOC+segment) into an auto-number-ID'ed parse of said MTC (or similar) document produced by OpenCCG's 'ccg-parse'. Usage: python merge-mtc-ids.py [output-of-OpenCCG-parser] [MTC-like-input-file] > [output-of-OpenCCG-parser-with-original-MTC-ids] """ import sys, os, re, codecs try: import chardet except: chardet = None from xml.etree.ElementTree import * doc_pattern = re.compile(u"<[Dd][Oo][Cc] docid=\"(.*)\" sysid=\"(.*)\">(.*)") seg_pattern = re.compile(u"(.*)$") openccg_in = sys.argv[1] #mtc_in = codecs.open(sys.argv[2], "rb", "utf-8").read() if not chardet is None: encoding = chardet.detect(open(sys.argv[2], "rb").read())['encoding'] else: encoding = "ISO-8859-2" mtc_in = codecs.open(sys.argv[2], "rb", encoding).readlines() # turn stdout into a UTF-8 converting writer. streamWriter = codecs.lookup(encoding)[-1] sys.stdout = streamWriter(sys.stdout) output = sys.stdout # map from auto-assigned ID to MTC ID. 
autoid2mtcid = {} mtc_ids = [] for l in mtc_in: l = l.strip() if l.startswith("" + os.linesep + "" + os.linesep) for event, elem in iterparse(openccg_in): if elem.tag.lower() == "item": next_mtc_id = mtc_ids.pop(0) elem.set("info", u",".join(next_mtc_id[:-1])) output.write(u"\t" + tostring(elem).strip() + os.linesep) output.write("" + os.linesep) ================================================ FILE: ccgbank/bin/merge-stanford-morpha-with-pos.py ================================================ """ Given two files: (1) the output of Stanford's re-implementation of 'morpha' and (2) the 'pairs' file of (), merge them into a morph.xml file. """ import sys, codecs, os from optparse import OptionParser as OP from xml.sax import saxutils pr = OP() pr.add_option("-m","--morpha_input",type="string",help="morpha input file (required arg)",\ default=None) pr.add_option("-p","--pairs_input",type="string",help="pairs input file (required arg)",\ default=None) pr.add_option("-o","--output",type="string",help="output location [default=]",\ default=sys.stdout) (opts,args) = pr.parse_args(sys.argv) # we do not check that you passed in the files (this is intended for internal use only, not as a # user-friendly app). pinf = codecs.open(opts.pairs_input,'rb','utf-8') minf = codecs.open(opts.morpha_input,'rb','utf-8') outf = opts.output if not outf is sys.stdout: outf = codecs.open(outf,'wb','utf-8') else: streamWriter = codecs.lookup("utf-8")[-1] outf = streamWriter(sys.stdout) pl = pinf.readline() ml = minf.readline() outf.write('' + '\n') outf.write('' + '\n') entries = [] try: while pl and ml: pl = pl.strip() ml = ml.strip() pl = pl.split() ml = ml.split() # skip blank lines from line ending differences if len(pl) < 2: pl = pinf.readline() ml = minf.readline() continue s = [' 2: s.append(' class="') s.append(saxutils.escape(pl[2])) s.append('"') if ml[0].lower() != pl[0].lower() and not ("^" in ml[0] or "*****" in ml[0]): # add stem only if distinct. s.append(' stem="') s.append(saxutils.escape(ml[0])) s.append('"') s.append('/>') entries.append(s[:]) pl = pinf.readline() ml = minf.readline() # sort/uniq entries.sort() last_one = None for e in entries: if last_one is None or e != last_one: outf.write(u''.join(e) + '\n') last_one = e outf.write('' + '\n') finally: pinf.close() minf.close() if not outf is sys.stdout: outf.close() ================================================ FILE: ccgbank/bin/merge_pos_ne.py ================================================ #!/usr/bin/env python """ Takes a POS-tagged file and a file of the original, NE-tagged text and writes out a file of: ... [word][POS][SEM_CLASS](if any)[stem](if any) ... (c) 2011 Dennis N. 
Mehay [insert LGPL here] """ class POSOutputIter: def __init__(self, filelikeobj): self.f = filelikeobj def __iter__(self): return self def next(self): try: nxtLn = self.f.readline().strip() nxtSent = [] if nxtLn != "": raise StopIteration nxtLn = self.f.readline().strip() while nxtLn != "": nxtSent.append(nxtLn) nxtLn = self.f.readline().strip() return nxtSent except: raise StopIteration import sys, codecs, os from optparse import OptionParser as OP pr = OP() pr.add_option("-p","--pos_in",type="string",help="POS-tagged input",\ default=None) pr.add_option("-n","--ner_tagged_in",type="string",help="NE-tagged input (no POS tags yet)",\ default=None) pr.add_option("-o","--output",type="string",help="output location [default=]",\ default=sys.stdout) (opts,args) = pr.parse_args(sys.argv) pinf = opts.pos_in if not pinf is sys.stdin: pinf = codecs.open(pinf,'r', 'utf-8') ninf = opts.ner_tagged_in if not ninf is sys.stdin: ninf = codecs.open(ninf,'r', 'utf-8') outf = opts.output if not outf is sys.stdout: outf = codecs.open(outf,'wb', 'utf-8') else: streamWriter = codecs.lookup("utf-8")[-1] outf = streamWriter(sys.stdout) try: for posSent in POSOutputIter(pinf): origSent = ninf.readline() for (posTW,NETagW) in zip(posSent, origSent.split()): NETagWParts = NETagW.split(u"_") if len(NETagWParts) > 1: NETag = u"\t" + NETagWParts[-1] else: NETag = "" posTW = posTW.split() w = posTW[0] tgs = posTW[1:][::2][:2] for t in tgs: outf.write(w + u"\t" + t + NETag + '\n') finally: pinf.close() ninf.close() outf.close() ================================================ FILE: ccgbank/bin/my_unicode.py ================================================ """ Useful functions for dealing with Unicode messiness that arises from dealing with messy input (e.g., gibberish from the Multiple Translation Chinese corpus). """ import re, doctest eval(r'u"[\u0080-\uffff]+"') RE_XML_ILLEGAL = u'([\u0000-\u0008\u000b-\u000c\u000e-\u001f\ufffe-\uffff])' + \ u'|' + \ u'([%s-%s][^%s-%s])|([^%s-%s][%s-%s])|([%s-%s]$)|(^[%s-%s])' % \ (unichr(0xd800),unichr(0xdbff),unichr(0xdc00),unichr(0xdfff), unichr(0xd800),unichr(0xdbff),unichr(0xdc00),unichr(0xdfff), unichr(0xd800),unichr(0xdbff),unichr(0xdc00),unichr(0xdfff)) invalid_char_re = re.compile("[^\u0009\u000a\u000d\u0020-\uD7FF\uE000-\uFFFD]") def removeInvalidChars(text): """ Text is a unicode string. All characters that are not valid XML characters are removed. """ return re.sub(RE_XML_ILLEGAL, "?", text) if __name__=="__main__": doctest.testmod() ================================================ FILE: ccgbank/bin/nbest-mtc-to-bleu-nist.py ================================================ """ This program takes the n-best realizer output as one file (with sys+DOC+segment IDs -- 'info' attributes), the tb.xml parser output of OpenCCG (for grabbing the strings of those things that did not parse), and creates an XML form suitable for use as a reference in the NIST-distributed BLEU script. Usage: python nbest-mtc-to-bleu-nist.py [nbest-from-realizer] [parser-output(tb.xml)] [max-n] | [NIST/BLEU-compatible-multiref-file] """ import sys, os, re, codecs, tempfile, xml.sax.saxutils try: import chardet except: chardet = None from xml.etree.ElementTree import * from collections import defaultdict # hack procedure. remove later. 
def remove_ne(txt): # remove: Time, Location, Organization, Person, Money, Percent, Date txt = txt.replace(" LOCATION", "").replace(" PERSON", "").replace(" MONEY", "").replace(" PERCENT", "").replace(" DATE", "").replace(" TIME", "").replace(" ORGANIZATION", "") return txt doc_pattern = re.compile(u"<[Dd][Oo][Cc] docid=\"(.*)\" sysid=\"(.*)\">(.*)") seg_pattern = re.compile(u"(.*)$") openccg_all = open(sys.argv[1], "rb").read().replace("_&", "_&").replace(" & ", "& ") parser_all = open(sys.argv[2], "rb").read().replace("_&", "_&").replace(" & ", "& ") if not chardet is None: encoding1 = chardet.detect(openccg_all)['encoding'] else: encoding1 = "utf-8" if not chardet is None: encoding2 = chardet.detect(parser_all)['encoding'] else: encoding2 = "utf-8" openccg_src = tempfile.NamedTemporaryFile() openccg_src.write(openccg_all) openccg_src.flush() openccg_all = None parser_src = tempfile.NamedTemporaryFile() parser_src.write(parser_all) parser_src.flush() parser_all = None try: n_size = int(sys.argv[3]) except: n_size = 4 # turn stdout into a UTF-8 converting writer. streamWriter = codecs.lookup("utf-8")[-1] sys.stdout = streamWriter(sys.stdout) output = sys.stdout # list of list of (ID/ref pairs) refs = [] # max number of unique refs in any (there may not 'n_size' in any of them) max_num_refs = 0 # map from docID -> [(segID, [text])] doc_to_segs = defaultdict(lambda: []) # get unparsed strings. for event, elem in iterparse(parser_src.name): if elem.tag.lower() == "item" and elem.get("numOfParses") == "0": txt = elem.get("string").strip() (sys,doc,seg) = elem.get("info").split(",") doc_to_segs[doc].append((seg, [txt])) for event, elem in iterparse(openccg_src.name): if elem.tag.lower() == "seg": (sys,doc,seg) = elem.get("id").split(",") is_complete = True if elem.get("complete") else False nbest_realizations = [] if not is_complete: # just get the original input. for child in list(elem): if child.tag.lower() == "ref": nbest_realizations.append(child.text.strip()) else: # get the n-best (only keeping unique strings), so, e.g., 4-best might turn into # 1-best if they're all the same. how_many = 0 for child in list(elem): if child.tag.lower() in ["ref", "best", "next"] and how_many < n_size: txt = child.text.strip() if not txt in nbest_realizations: nbest_realizations.append(txt) how_many += 1 elif how_many >= n_size: break if len(nbest_realizations) > max_num_refs: max_num_refs = len(nbest_realizations) doc_to_segs[doc].append((seg, nbest_realizations)) output.write("" + \ os.linesep + "" + os.linesep +\ "" + os.linesep) docs = doc_to_segs.keys() docs.sort() for i in range(max_num_refs): output.write("" % (i+1) + os.linesep) for doc in docs: output.write(" " % doc + os.linesep) segs = doc_to_segs[doc] segs.sort(lambda a,b: cmp(int(a[0]), int(b[0]))) for (seg, paraphrases) in segs: this_one = i if i >= len(paraphrases): # there aren't as many paraphrases here as there are in the maximum length ref, so we just re-duplicate # the last one of this ref. 
this_one = len(paraphrases)-1 output.write(" %s " % (int(seg), xml.sax.saxutils.escape(remove_ne(paraphrases[this_one].replace("_"," "))) + os.linesep)) output.write(" " + os.linesep) output.write("" + os.linesep) output.write("") ================================================ FILE: ccgbank/bin/ner/NERApp/src/nerapp/NERApp.java ================================================ package nerapp; import java.io.*; //import edu.stanford.nlp.ie.crf.*; import edu.stanford.nlp.ie.AbstractSequenceClassifier; import edu.stanford.nlp.ie.NERClassifierCombiner; import edu.stanford.nlp.io.IOUtils; import edu.stanford.nlp.ling.CoreAnnotations; import edu.stanford.nlp.ling.HasWord; import edu.stanford.nlp.sequences.DocumentReaderAndWriter; import edu.stanford.nlp.sequences.PlainTextDocumentReaderAndWriter; import edu.stanford.nlp.util.CoreMap; import java.io.IOException; import java.util.ArrayList; import java.util.List; /** This tags text using the Stanford NE tagger API. *

* Usage: java -cp "stanford-core-nlp.jar:." NERApp [inputFileName] [outputFileName] [classifierModelFile1] (...[classifierModelFile10]) *

* There are no default arguments. * (Created by modifying Jenny Finkel and Chris Manning's example "NERDemo.java".) *

* @author Dennis N. Mehay */ public class NERApp { @SuppressWarnings("unchecked") public static void main(String[] args) throws IOException { DocumentReaderAndWriter readerAndWriter = new PlainTextDocumentReaderAndWriter(); String usageStr = System.getProperty("line.separator") + "java -cp \"stanford-core-nlp.jar:.\" NERApp [inputFileName] [outputFileName] [classifierModelFile1] (...[classifierModelFile10])"+ System.getProperty("line.separator") + System.getProperty("line.separator") + "(I.e., you can specify between one and ten classifiers whose predictions will be combined.\n"+ "Specify the best model first -- it will have precedence in the model combination.)" + System.getProperty("line.separator"); if (args.length < 3) { System.out.println(usageStr); System.exit(-1); } String[] classifierMods = new String[10]; for(int j = 2; j < args.length; j++) { classifierMods[j-2] = args[j].trim(); } int numClassifiers = 0; AbstractSequenceClassifier classifier = null; //CRFClassifier.getClassifierNoExceptions(serializedClassifier); for(String classMod : classifierMods) { if(classMod != null) { numClassifiers++; } } switch (numClassifiers) { case 1: classifier = new NERClassifierCombiner(true, false, false, classifierMods[0]); break; case 2: classifier = new NERClassifierCombiner(true, false, false, classifierMods[0], classifierMods[1]); break; case 3: classifier = new NERClassifierCombiner(true, false, false, classifierMods[0], classifierMods[1], classifierMods[2]); break; case 4: classifier = new NERClassifierCombiner(true, false, false, classifierMods[0], classifierMods[1], classifierMods[2], classifierMods[3]); break; case 5: classifier = new NERClassifierCombiner(true, false, false, classifierMods[0], classifierMods[1], classifierMods[2], classifierMods[3], classifierMods[4]); break; case 6: classifier = new NERClassifierCombiner(true, false, false, classifierMods[0], classifierMods[1], classifierMods[2], classifierMods[3], classifierMods[4], classifierMods[5]); break; case 7: classifier = new NERClassifierCombiner(true, false, false, classifierMods[0], classifierMods[1], classifierMods[2], classifierMods[3], classifierMods[4], classifierMods[5], classifierMods[6]); break; case 8: classifier = new NERClassifierCombiner(true, false, false, classifierMods[0], classifierMods[1], classifierMods[2], classifierMods[3], classifierMods[4], classifierMods[5], classifierMods[6], classifierMods[7]); break; case 9: classifier = new NERClassifierCombiner(true, false, false, classifierMods[0], classifierMods[1], classifierMods[2], classifierMods[3], classifierMods[4], classifierMods[5], classifierMods[6], classifierMods[7], classifierMods[8]); break; case 10: classifier = new NERClassifierCombiner(true, false, false, classifierMods[0], classifierMods[1], classifierMods[2], classifierMods[3], classifierMods[4], classifierMods[5], classifierMods[6], classifierMods[7], classifierMods[8], classifierMods[9]); break; default: System.out.println(usageStr); System.exit(-1); } Iterable sents = IOUtils.readLines(args[0]); BufferedWriter outf = new BufferedWriter(new FileWriter(new File(args[1]))); for (String sent : sents) { String[] parts = sent.split("\\s+"); List wdList = new ArrayList(parts.length); for(String w : parts) { wdList.add(new MyWord(w)); } List tagging = classifier.classifySentence(wdList); String currNE = null; StringBuilder res = new StringBuilder(); String wd, annot; int cursor = -1; for(CoreMap item : tagging) { cursor += 1; wd = item.get(CoreAnnotations.TextAnnotation.class); annot = 
item.get(CoreAnnotations.AnswerAnnotation.class); if(annot != null && annot.equals("O") || annot.equals("MISC")) { annot = null; } if(currNE != null && !currNE.equals(annot)) { res.append(""); currNE = null; } if(annot != null && !annot.equals(currNE)) { currNE = annot; res.append(" "); res.append("<"); res.append(currNE); res.append(">"); res.append(wd); } else { res.append(" "); res.append(wd); } } if(null != currNE) { res.append(""); } outf.write(res.toString() + System.getProperty("line.separator")); outf.flush(); } outf.close(); } public static String classifyToString(List sentence, DocumentReaderAndWriter readerAndWriter, AbstractSequenceClassifier classif) { PlainTextDocumentReaderAndWriter.OutputStyle outFormat = PlainTextDocumentReaderAndWriter.OutputStyle.fromShortName("inlineXML"); DocumentReaderAndWriter tmp = readerAndWriter; readerAndWriter = new PlainTextDocumentReaderAndWriter(); readerAndWriter.init(classif.flags); StringBuilder sb = new StringBuilder(); sb.append(((PlainTextDocumentReaderAndWriter) readerAndWriter).getAnswers(sentence, outFormat, true)); return sb.toString(); } } class MyWord implements HasWord { private String wd = null; public MyWord(String wd) { this.wd = wd; } public String word() { return wd; } public void setWord(String string) { this.wd = string; } } ================================================ FILE: ccgbank/bin/ner/build-ner-api.properties ================================================ # For compiling against the Stanford API. stanford.core.nlp=../../stanford-nlp/stanford-core-nlp.jar ================================================ FILE: ccgbank/bin/ner/build-ner-api.xml ================================================ ================================================ FILE: ccgbank/bin/ner/ner-tag.sh ================================================ #!/bin/bash # # Tag a file $1 using Stanford NER located in base directory $2 (first arg, e.g., "/home/me/stanford-ner-2.1.0") # with model $3 (second arg, e.g., "all.3class.distsim.crf.ser.gz"). # # Output is placed in the file whose path is given in argument $4. # java -mx700m -cp "$1/stanford-ner.jar:`dirname $0`/NERApp.jar" nerapp.NERApp $2/classifiers/$3 $1 2> /dev/null | python `dirname $0`/post-process-stanford-ner.py > $4 ================================================ FILE: ccgbank/bin/ner/ner_word.py ================================================ class NERWord: """ A simple wrapper for NER-labelled words. """ def __init__(self, wd, label=None, delim="/"): self.wd = wd self.label = label self.delim = delim @staticmethod def parseLineOfWords(ln): """ Parses a line of words labelled with NE labels (e.g., "John Smith entered the United States"). """ res = [] for w in ln: if ""): parts = w.partition("" in wd: parts = wd.partition(">") wd = parts[2] lb = lb[2:-1] elif w.startswith("<") and ">" in w: parts = w.partition(">") (wd,lb) = (parts[2], parts[0]+">") else: (wd,lb) = (w,None) res.append((wd,lb)) # now distribute the labels to words between within the ... labels. final_res = [] i = len(res) - 1 while i >= 0: (wd,lb) = res[i] if lb is None: final_res.append(NERWord(wd,lb)) elif not "US Dept of Defense example ." | python post-process-stanford-ner.py This is a US_Dept_of_Defense_ORGANIZATION example . Type: $ python post-process-stanford-ner.py -h for help on the command-line options. 
""" def fuseNERWords(list_of_ner_words): return "_".join([nerWrd.getWord() for nerWrd in list_of_ner_words] + [list_of_ner_words[0].getLabel()]) op = optparse.OptionParser() op.add_option("--known_verbs", type="string", \ help="file containing known verbs (for split-at-verb-boundary heuristic) [defaults to an empty list of known verbs]",\ default=None) (ops, args) = op.parse_args() known_verbs = set([v.strip() for v in open(ops.known_verbs, "rb").readlines()]) if not ops.known_verbs is None else set() puncts = set([',', "'", '"', ".", "?", "!"]) heuristic_splitters = (known_verbs | puncts) for l in sys.stdin: l = l.strip() if l == "": continue ner_parts = l.split() ner_parts = NERWord.parseLineOfWords(ner_parts) i = 0 current_NE = None current_group = None res = [] while i < len(ner_parts): prt = ner_parts[i] (wd,ne) = (prt.getWord(), prt.getLabel()) if not ne is None: # we have a NE label. is it a continuation of what came before (if anything)? if ne == current_NE: current_group.append(prt) else: if current_NE is None: current_NE = ne current_group = [prt] else: res.append(fuseNERWords(current_group)) current_NE = ne current_group = [prt] else: if not current_NE is None: res.append(fuseNERWords(current_group)) current_NE = None current_group = None res.append(wd) i += 1 if not current_NE is None: res.append(fuseNERWords(current_group)) print " ".join(res) ================================================ FILE: ccgbank/bin/normalize_text.py ================================================ """ Assuming UTF-8 input (defaults to stdin, otherwise, supply a file), normalize plain text in various ways -- e.g., normalize quotation marks. Copyright Dennis N. Mehay (2011) [Insert LGPL here] """ from optparse import OptionParser as OP import codecs, sys, os op = OP() op.add_option("-i", "--input", type="string", help="input stream of text (file, or default=sys.stdin)", default=sys.stdin) op.add_option("-o", "--output", type="string", help="output stream (file, or default=sys.stdout)", default=sys.stdout) (ops,args) = op.parse_args() if not ( ops.input is sys.stdin or ops.input == "-" ): inf = codecs.open(ops.input, "rb", "utf-8") else: streamReader = codecs.lookup("utf-8")[2] inf = streamReader(sys.stdin) if not ( ops.output is sys.stdout or ops.output == "-" ): outf = codecs.open(ops.output, "wb", "utf-8") else: streamWriter = codecs.lookup("utf-8")[-1] outf = streamWriter(sys.stdout) try: l = inf.readline().strip() while l: transformed_line = [] opening_quotes = True for c in l: if c == u'"' and opening_quotes: transformed_line.append(u"``") opening_quotes = False # next double quotes will be closing quotes. elif c == u'"' and not opening_quotes: transformed_line.append(u"''") opening_quotes = True # reset the open-close tracker. else: transformed_line.append(c) outf.write(u"".join(transformed_line) + os.linesep) l = inf.readline().strip() finally: inf.close() outf.close() ================================================ FILE: ccgbank/bin/post-process-metricsmatr.py ================================================ """ Pipe in a MetricsMATR-style mteval script output and, given (as sys.argv[1]) the name of the reference system, produce a file that has lines of the form: ,,,, ... 
,,,, """ import sys refid = sys.argv[1].strip() for l in sys.stdin: # e.g., "multiple_translation_set E09 XIN20020316.0014 1 0.0715856157727753" (setid,sysid,docid,segid,score) = l.strip().split() print ",".join([sysid, refid, docid, segid, score]) ================================================ FILE: ccgbank/bin/prepare-for-stanford-morpha.py ================================================ """ Take in a space-delimited file of ...... and turn it into a form that the Stanford NE recognizer can accept (and from which we can extract all the information we need later). => """ import sys, codecs, os streamWriter = codecs.lookup("utf-8")[-1] sys.stdout = streamWriter(sys.stdout) streamReader = codecs.lookup("utf-8")[2] sys.stdin = streamReader(sys.stdin) for l in sys.stdin: l = l.strip() parts = l.split() if len(parts) > 2: # has NE label. wordform = u"*****".join([parts[0],parts[-1]]).replace("_","^") else: wordform = parts[0] pos = parts[1] joined = u"_".join([wordform, pos]) sys.stdout.write(joined + '\n') ================================================ FILE: ccgbank/bin/reverse-spaces-to-newlines.py ================================================ # # reverses the conversion from spaces to newlines, and newlines to special chars, # from stdin to stdout # import sys, re; [sys.stdout.write(re.sub('','\n',re.sub('\n',' ',line))) for line in sys.stdin] ================================================ FILE: ccgbank/bin/run-all-bleu.sh ================================================ #!/bin/bash # run Bleu/NIST on all systems sys directory (passed in) with all references in the ref directory # (also passed in as an arg). # $1 is the mteval script. # $2 is the location of the system directory (where all the system files are stored) # $3 is the location of the reference directory (where all the reference files are stored). # $4 is the location of the source *file*. # $5 is the location where the scores will go. curr_dir=`dirname $0` for sys in `ls $2/E*` do for ref in `ls $3/*` do echo "Command line: $1 --metricsMATR -t $sys -r $ref -s $4" sys_shortname=`basename ${sys} | sed "s/^\(E[0-9][0-9]\).*/\1/g"` ref_shortname=`basename ${ref} | sed "s/^\(E[0-9][0-9]\).*/\1/g"` $1 --metricsMATR -t $sys -r $ref -s $4 cat BLEU-seg.scr | python $curr_dir/post-process-metricsmatr.py ${ref_shortname} > $5/BLEU.${sys_shortname}-${ref_shortname}.scr cat NIST-seg.scr | python $curr_dir/post-process-metricsmatr.py ${ref_shortname} > $5/NIST.${sys_shortname}-${ref_shortname}.scr rm BLEU-*; rm NIST-*; done done ================================================ FILE: ccgbank/bin/stem_nns_vbx ================================================ #/bin/bash # # produces a file .dir/morph from .dir/pairs # that lists the words, pos tags and, for plural nouns and verbs, # also stems, derived using morpha # # write plural nouns and verbs to .dir/nns-vbx cat $1.dir/pairs | sort | uniq | grep -E "NNS|VB." > $1.dir/nns-vbx # get rest cat $1.dir/pairs | sort | uniq | grep -E -v "NNS|VB." | grep -E -v "s>" > $1.dir/non-nns-vbx # get stems cat $1.dir/nns-vbx | tr [:blank:] _ | morpha > $1.dir/nns-vbx.stems # merge stems paste $1.dir/nns-vbx $1.dir/nns-vbx.stems > $1.dir/nns-vbx-stems # merge files cat $1.dir/non-nns-vbx $1.dir/nns-vbx-stems | sort | uniq > $1.dir/morph # cleanup rm -f $1.dir/nns-vbx* $1.dir/non-nns-vbx ================================================ FILE: ccgbank/bin/toUTF-8.py ================================================ """ Copryright (c) 2011 Dennis N. Mehay Assumes that 'chardet' is installed. 
Re-encodes most known Unicode encodings as UTF-8. (Provided that there is enough text for chardet to correctly determine the encoding of the input file.) If any file exists by the output file name, it will be overwritten. [Insert LGPL here] """ import sys, codecs, optparse try: import chardet except ImportError, ie: print >> sys.stderr, "'chardet' must be installed for this script to work. Exiting..." sys.exit(-1) op = optparse.OptionParser() op.add_option("-i", "--inputf", type="string", help="input file [required]", default=None) op.add_option("-o", "--outputf", type="string", help="output file [required, will be overwritten]", default=None) (ops,args) = op.parse_args() try: assert(not (ops.inputf is None or ops.outputf is None)) except AssertionError, ae: print >> sys.stderr, "provide input and output files (type: 'python toUTF-8.py -h' for help)" sys.exit(-1) # get input file's content and convert to utf-8 inf = open(ops.inputf, "rb") input = inf.read() outf = None try: encoding = chardet.detect(input).get('encoding') input = input.decode(encoding) outf = codecs.open(ops.outputf, "wb", "utf-8") outf.write(input) except Exception, e: print >> sys.stderr, "Something went wrong. Perhaps your input format is too obscure" finally: outf.close() inf.close() ================================================ FILE: ccgbank/bin/write_morph.py ================================================ #!/usr/bin/env python """ Takes a file of word-tag pairs or word-tag-stem triples and writes an xml morph file. (c) 2010 Michael White (modifed by D.N. Mehay 2011) [insert LGPL here] """ import sys from optparse import OptionParser as OP from xml.sax import saxutils global sem_classes sem_classes = set(["PERSON", "ORGANIZATION", "LOCATION", "MONEY", "PERCENT", "TIME", "DATE"]) pr = OP() pr.add_option("-i","--input",type="string",help="input source [default=]",\ default=sys.stdin) pr.add_option("-o","--output",type="string",help="output location [default=]",\ default=sys.stdout) (opts,args) = pr.parse_args(sys.argv) inf = opts.input if not inf is sys.stdin: inf = open(inf,'r') outf = opts.output if not outf is sys.stdout: outf = open(outf,'w') try: print >> outf, '' for l in inf: l = l.strip() l = l.split() s = ['= 3: if l[2] in sem_classes: s.append(' class="') s.append(saxutils.escape(l[2])) s.append('"') else: s.append(' stem="') s.append(saxutils.escape(l[2])) s.append('"') if len(l) >= 4: s.append(' stem="') s.append(saxutils.escape(l[3])) s.append('"') finally: if not inf is sys.stdin: inf.close() if not outf is sys.stdout: outf.close() ================================================ FILE: ccgbank/build-ht.properties ================================================ # nb: info.dir is specified in build.properties preds.train=${info.dir}/preds-train preds.dev=${info.dir}/preds-00-all ht.factors.train=${info.dir}/ht.factors.train ht.factors.dev=${info.dir}/ht.factors.dev grammar.dir=${extract.dir} ht.corpus.dir=${extract.dir}/test ht.feats.dir=${feats.dir}/hypertagger ht.models.dir=${models.dir}/hypertagger pos.lm=${ht.models.dir}/pos.lm st.lm=${ht.models.dir}/st.lm vocab.pos=${ht.models.dir}/vocab.pos vocab.st=${ht.models.dir}/vocab.st vocab.train=${ht.models.dir}/vocab.train posprior.lm=${ht.models.dir}/p_w0.lm pos.feats=${ht.feats.dir}/pos.feats pos.dev.feats=${ht.feats.dir}/pos.feats.00 pos.mod=${ht.models.dir}/pos.mod htprior.lm=${ht.models.dir}/t_p0w0.lm pos.dict=${ht.models.dir}/pos.dict.min10 word.dict=${ht.models.dir}/word.dict.min10 ht.feats=${ht.feats.dir}/ht.feats 
ht2.feats=${ht.feats.dir}/ht2.feats ht.dev.feats=${ht.feats.dir}/ht.dev.feats ht.dev.log=${log.dir}/ht.dev.log ht.mod=${ht.models.dir}/ht.mod ht2.mod=${ht.models.dir}/ht2.mod argnames=Arg0:A0 Arg1:A1 Arg1a:A1a Arg1b:A1b Arg2:A2 Arg2a:A2a Arg2b:A2b Arg3:A3 Arg4:A4 Arg5:A5 ================================================ FILE: ccgbank/build-ht.xml ================================================ ================================================ FILE: ccgbank/build-models.properties ================================================ # nb: info.dir is specified in build.properties factors.train=${info.dir}/factors-train factors.dev=${info.dir}/factors-00-all text.train=${info.dir}/text-train text.sc.train=${info.dir}/textsc-train text.dev=${info.dir}/text-00-all catfreq.cutoff=10 feats.dir=./feats models.dir=./models plugins.dir=./plugins original.postagger.models.dir=./original/models/postagger novel.dir=${data.dir}/novel novel.file=${novel.dir}/two-sents ================================================ FILE: ccgbank/build-models.xml ================================================ Invoking supertagger all Done Invoking parser all Done Invoking hypertagger all Done Invoking realizer all Done ================================================ FILE: ccgbank/build-original.properties ================================================ # nb: original.ccgbank.dir and data.dir are specified in build.properties original.dir=./original corpus.dir=${original.dir}/corpus feats.dir=${original.dir}/feats models.dir=${original.dir}/models original.log.dir=${original.dir}/logs train.leaves.srilm=${corpus.dir}/train.leaves.srilm dev.leaves.srilm=${corpus.dir}/dev.leaves.srilm postagger.feats.dir=${feats.dir}/postagger postagger.models.dir=${models.dir}/postagger supertagger.feats.dir=${feats.dir}/supertagger supertagger.models.dir=${models.dir}/supertagger train.pos.seq=${postagger.feats.dir}/train.pos.seq pos.lm=${postagger.models.dir}/pos.lm train.st.seq=${supertagger.feats.dir}/train.st.seq st.lm=${supertagger.models.dir}/st.lm vocab.pos=${postagger.models.dir}/vocab.pos vocab.st=${supertagger.models.dir}/vocab.st vocab.train=${supertagger.models.dir}/vocab.train posprior.lm=${postagger.models.dir}/p_w0.lm pos.feats=${postagger.feats.dir}/pos.feats pos.mod=${postagger.models.dir}/pos.mod stprior.lm=${supertagger.models.dir}/t_p0w0.lm pos.dict=${supertagger.models.dir}/pos.dict.min10 word.dict=${supertagger.models.dir}/word.dict.min10 st.feats=${supertagger.feats.dir}/st.feats st.mod=${supertagger.models.dir}/st.mod novel.dir=${data.dir}/novel novel.file=${novel.dir}/two-sents ================================================ FILE: ccgbank/build-original.xml ================================================ ================================================ FILE: ccgbank/build-ps.properties ================================================ # nb: feats.dir and models.dir are specified in build-models.properties parser.feats.dir=${feats.dir}/parser parser.models.dir=${models.dir}/parser deriv.factors.train=${parser.feats.dir}/deriv.factors.train vocab.parser.train=${parser.models.dir}/vocab.parser.train nbest.list.size=5 original.postagger.models.dir=./original/models/postagger # what percentage of first 10 words being cased makes the heuristic say a sentence is in # title-case? 
(change if desired) titlecase.threshold=0.5 # you will need to download and extract ccgbank-data.tgz or english-models.tgz to get the truecase list truecase.list=./aux/aux-files/truecase-list.gz # we assume you have the stanford core nlp jar file and NE tagging models # see docs/ccgbank-README for installation instructions # you can also modify the properties below to point to the jar and model files elsewhere stanford.core.nlp.dir=./stanford-nlp stanford.core.nlp.jar=${stanford.core.nlp.dir}/stanford-core-nlp.jar # by default, we assume you have placed the Stanford core NLP jar file in ./stanford-nlp, and that # there are the following models in a subdirectory there called 'classifiers' # (you can get Stanford NE recognition models from: http://nlp.stanford.edu/software/CRF-NER.shtml # or from the core NLP download, per docs/ccgbank-README) ner.model1=${stanford.core.nlp.dir}/classifiers/english.all.3class.distsim.crf.ser.gz ner.model2=${stanford.core.nlp.dir}/classifiers/english.muc.7class.distsim.crf.ser.gz ner.model3=${stanford.core.nlp.dir}/classifiers/english.conll.4class.distsim.crf.ser.gz # if you're using an older version of the Stanford NLP tools, it may # be convenient to comment in the older names below #ner.model1=${stanford.core.nlp.dir}/classifiers/all.3class.distsim.crf.ser.gz #ner.model2=${stanford.core.nlp.dir}/classifiers/muc.distsim.crf.ser.gz #ner.model3=${stanford.core.nlp.dir}/classifiers/conll.distsim.crf.ser.gz ================================================ FILE: ccgbank/build-ps.xml ================================================ Extracting derivation factors for section @{sect} Concatenating training derivation factors to ${deriv.factors.train} Copying train grammar with cutoffs to ${extract.dir} Copying dev morph to ${extract.dir} Loading parse.prefs Parsing dev section to ${log.dir}/parse.dev.log Concatenating training derivation factors excluding sect @{sect} to ${deriv.factors.train}.excl@{sect} Copying flm files to ${parser.models.dir}/excl@{sect} Generating parser training events for sect @{sect} Copying train grammar with to ${extract.dir} Loading gen-events.prefs Generating events to ${parser.feats.dir}/events-@{sect}.gz Concatenating event files to ${parser.feats.dir}/events-train.gz Concatenating ${parser.feats.dir}/events-@{sect}.gz Calculating feature alphabet as ${parser.feats.dir}/alph.gz Training perceptron model to ${parser.models.dir}/model.gz Loading parse.prefs Parsing dev section to ${log.dir}/parse.perceptron.dev.log Copying training grammar with cutoffs and other miscellanea to ${novel.file}.dir/extract/ Merging training morph (with cutoffs) and novel morph to ${novel.file}.dir/extract/morph.xml Loading parse.prefs Parsing ${novel.file}.dir/nertext-nolabs to ${novel.file}.dir/tb.xml Loading parse.prefs Parsing ${novel.file}.dir/nertext-nolabs to ${novel.file}.dir/tb.xml ================================================ FILE: ccgbank/build-release.xml ================================================ ================================================ FILE: ccgbank/build-rz.properties ================================================ # nb: feats.dir and models.dir is specified in build-models.properties realizer.feats.dir=${feats.dir}/realizer realizer.models.dir=${models.dir}/realizer realizer.model.global=model.global realizer.alph.init=alph.init realizer.alph.name=alph.gz realizer.model.name=model.gz big.words.lm=${realizer.models.dir}/gigaword4.5g.kenlm.bin words.lm=${realizer.models.dir}/train.3bo 
words.sc.lm=${realizer.models.dir}/train-sc.3bo stpos.flm=${realizer.models.dir}/stp3.flm # nb: vocab.train is copied from build-st.properties (which is otherwise not needed) supertagger.models.dir=${models.dir}/supertagger vocab.train=${supertagger.models.dir}/vocab.train # todo: import this property instead hypertagger.models.dir=${models.dir}/hypertagger # nb: parser.models.dir is copied from build-ps.properties (which is otherwise not needed) parser.models.dir=${models.dir}/parser ================================================ FILE: ccgbank/build-rz.xml ================================================ Copying train grammar to ${extract.dir} Copying dev morph to ${extract.dir} Copying test morph to ${extract.dir} Loading gen-events.prefs Loading rz-test.prefs Concatenating training text excluding sect @{sect} to ${text.train}.excl@{sect} Concatenating sem class replaced training text excluding sect @{sect} to ${text.sc.train}.excl@{sect} Building trigram language model to ${realizer.models.dir}/excl/train.excl@{sect}.3bo Building trigram language model to ${realizer.models.dir}/excl/train-sc.excl@{sect}.3bo Deleting concatenated text files Invoking parser target for generative models excluding each section Done Generating realizer training events for sect @{sect} Copying train grammar to ${extract.dir} Generating events to ${realizer.feats.dir}/events-@{sect}.gz Concatenating event files to ${realizer.feats.dir}/events-train.gz Concatenating ${realizer.feats.dir}/events-@{sect}.gz Calculating feature alphabet as ${realizer.feats.dir}/alph.gz Training perceptron model with global feats to ${realizer.models.dir}/${realizer.model.global} Training perceptron model to ${realizer.models.dir}/${realizer.model.name} from ${realizer.feats.dir}/${realizer.alph.name} Realizing dev section to ${log.dir}/realize.dev.log Realizing dev section to ${log.dir}/realize.perceptron.dev.log Realizing test section to ${log.dir}/realize.perceptron.test.log Realizing ${novel.file}.dir/tb.xml to ${novel.file}.dir/realize.nbest ================================================ FILE: ccgbank/build-st.properties ================================================ # nb: feats.dir and models.dir are specified in build-models.properties supertagger.feats.dir=${feats.dir}/supertagger supertagger.models.dir=${models.dir}/supertagger train.pos.seq=${supertagger.feats.dir}/train.pos.seq pos.lm=${supertagger.models.dir}/pos.lm train.st.seq=${supertagger.feats.dir}/train.st.seq st.lm=${supertagger.models.dir}/st.lm vocab.pos=${supertagger.models.dir}/vocab.pos vocab.st=${supertagger.models.dir}/vocab.st vocab.train=${supertagger.models.dir}/vocab.train posprior.lm=${supertagger.models.dir}/p_w0.lm pos.feats=${supertagger.feats.dir}/pos.feats pos.mod=${supertagger.models.dir}/pos.mod pos.dict=${supertagger.models.dir}/pos.dict.min10 word.dict=${supertagger.models.dir}/word.dict.min10 st.feats=${supertagger.feats.dir}/st.feats st.mod=${supertagger.models.dir}/st.mod ================================================ FILE: ccgbank/build-st.xml ================================================ ================================================ FILE: ccgbank/build.properties ================================================ data.dir=./data templates.dir=./templates convert.dir=./convert extract.dir=./extract info.dir=${extract.dir}/info test.dir=${extract.dir}/test grams.dir=${extract.dir}/grammars log.dir=./logs tmp.dir=./tmp training.dirs=02,03,04,05,06,07,08,09,10,11,12,13,14,15,16,17,18,19,20,21 # nb: the "propccgbank" and aux files 
should be unpacked from # the ccgbank-data.tgz (see docs/ccgbank-README for details); # the original ccgbank dir property below can be changed to # point to your copy of the CCGBank, or you can just create a # symbolic link from ./ccgbank1.1 to your copy of it ccgbank.dir=./propccgbank/pp_head_verbsAnnotated/AUTO original.ccgbank.dir=./ccgbank1.1/data/AUTO #sect=* sect=00 #file=* file=wsj_0001 aux.top.dir=./aux aux.dir=${aux.top.dir}/aux-files words=${data.dir}/wsj-nns-vb stems=${data.dir}/wsj-nns-vb-stems ================================================ FILE: ccgbank/build.xml ================================================ Extracting grammar with no cutoffs and making LFs Section: ${sect} File: ${file} Concatenating @{type}-train Starting extract task for section @{sect} Concatenating training section files in ${info.dir} Extracting grammar with no cutoffs and making LFs with debug derivs true Section: ${sect} File: ${file} ================================================ FILE: ccgbank/data/README ================================================ The files wsj-nns-vb and wsj-nns-vb-stems contain the plural nouns & verbs and their stems, respectively, from the WSJ part of the Penn Treebank, as computed by the morpha tool. Sample commands for creating these files (with directories on the OSU Linguistics system) are in get_wsj_nns_vb and stem_wsj_nns_vb. There are also some made-up sentences for testing the parser and realizer in novel/two-sents, and an example CCGbank file with Propbank roles and corrections in the sample dir. ================================================ FILE: ccgbank/data/get_wsj_nns_vb ================================================ cat /home/corpora/EN/penn_treebank_3/ims-cwb/wsj/wsj.cqp | egrep "NNS|VB" | sort | uniq > wsj-nns-vb ================================================ FILE: ccgbank/data/novel/two-sents ================================================ Google announced today that it would offer free texting on its Google Voice app for the iPhone. The press release was greeted rapturously. 
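A hedged sketch (not a file in the repository): one way to pair the line-parallel wsj-nns-vb and wsj-nns-vb-stems files described in data/README above into a (word, tag) -> stem lookup. The helper name, default paths, and the assumption that morpha may leave a trailing _TAG on each stem are illustrative only.

def load_stem_table(words_path="wsj-nns-vb", stems_path="wsj-nns-vb-stems"):
    # Assumed layout: wsj-nns-vb holds "word TAG" per line and wsj-nns-vb-stems
    # holds the corresponding morpha output on the same line number
    # (per data/get_wsj_nns_vb and data/stem_wsj_nns_vb).
    table = {}
    with open(words_path) as wf, open(stems_path) as sf:
        for word_line, stem_line in zip(wf, sf):
            parts = word_line.split()              # e.g. "abilities NNS"
            if len(parts) < 2 or not stem_line.strip():
                continue
            word, tag = parts[0], parts[1]
            stem = stem_line.split()[0].split("_")[0]   # drop any trailing _TAG
            table[(word, tag)] = stem
    return table

# e.g. load_stem_table().get(("abilities", "NNS")) should yield the morpha stem,
# presumably "ability".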
================================================ FILE: ccgbank/data/sample/AUTO/00/wsj_0001.auto ================================================ ID=wsj_0001.1 PARSER=GOLD NUMPARSE=1 ( ( ( ( ( ( ( () () ) ) () ) ( ( ( ( () () ) ) () ) ) ) () ) ( () ( ( ( () ( () () ) ) ( () ( () ( () () ) ) ) ) ( () () ) ) ) ) () ) ID=wsj_0001.2 PARSER=GOLD NUMPARSE=1 ( ( ( ( () () ) ) ( () ( ( () ) ( () ( ( ( () () ) ) ( () ( () ( () ( () () ) ) ) ) ) ) ) ) ) () ) ================================================ FILE: ccgbank/data/stem_wsj_nns_vb ================================================ cat wsj-nns-vb | tr [:blank:] _ | ./morpha.ix86_linux > wsj-nns-vb-stems ================================================ FILE: ccgbank/data/wsj-nns-vb ================================================ 12-inches NNS 15 VBN 16-year-olds NNS 1850s NNS 1890s NNS 18-year-olds NNS 1900s NNS 1920s NNS 1930s NNS 1940s NNS 1950s NNS 1960s NNS 1970s NNS 1980s NNS 1990s NNS 19-year-olds NNS 204s NNS 20s NNS 20-stocks NNS 3090s NNS '30s NNS 30s NNS 323s NNS '40s NNS '50s NNS '60s NNS '70s NNS 747-400s NNS 757-200s NNS 75-cents-an-hour NNS '80s NNS 80s NNS 8300s NNS '90s NNS A330-300s NNS abacuses NNS abandoned VBD abandoned VBN abandoning VBG Abandoning VBG abandons VBZ abandon VB abandon VBP abated VBD abated VBN abates VBZ abate VB abating VBG abdicate VBP abetted VBN abetting VBG abide VB abilities NNS abolished VBD abolished VBN abolishing VBG abolish VB aborted VBN abortion-rights NNS Abortion-rights NNS abortions NNS abounded VBD abounding VBG abounds VBZ abound VBP abrasives NNS abridging VBG absences NNS absent VB Absent VB absolve VBP absolving VBG absorbed VBD absorbed VBN Absorbed VBN absorbers NNS absorbing VBG absorbs VBZ absorb VB absorb VBP abstained VBD abstentions NNS abstracts NNS abused VBD abused VBN abuses NNS abuse VB abusing VBG academics NNS acceded VBD accede VB accelerated VBD accelerated VBN accelerates VBZ accelerate VB accelerate VBP accelerating VBG accents NNS acceptances NNS ACCEPTANCES NNS accepted VBD accepted VBN accepting VBG accepts VBZ accept VB accept VBP accessories NNS Accessories NNS access VB accidents NNS acclaim VB accolades NNS accommodated VBN accommodate VB accommodate VBP accommodating VBG accommodations NNS accomodate VB accompanied VBD accompanied VBN accompanies VBZ accompanying VBG accompany VB accomplished VBN accomplishes VBZ Accomplishing VBG accomplishments NNS accomplish VB accorded VBD accorded VBN according VBG According VBG accords NNS accord VB accountants NNS accounted VBD accounted VBN accounting VBG accounts NNS Accounts NNS accounts VBZ account VB account VBP accreted VBN accruals NNS accrued VBN Accrued VBN accrues VBZ accrue VB accruing VBG accumulated VBN accumulate VBP accumulating VBG accusations NNS accused VBD accused VBN accusers NNS accuses VBZ accuse VB accuse VBP accusing VBG accustomed VBN aces VBZ achieved VBD achieved VBN achievements NNS achieves VBZ achieve VB achieve VBP achieving VBG aching VBG acidified VBN acids NNS acknowledged VBD acknowledged VBN acknowledges VBZ acknowledge VB acknowledge VBP acknowledging VBG acorns NNS acquainted VBN acquiesced VBD acquiesce VB acquired VBD acquired VBN Acquired VBN acquirers NNS Acquirers NNS acquires VBZ acquire VB acquiring VBG acquisitions NNS Acquisitions NNS acquitted VBN acquit VB acres NNS across-the-board-cuts NNS acted VBD acted VBN acting VBG Acting VBG actions NNS activated VBN activate VBP actives NNS activists NNS Activists NNS activities NNS actors NNS acts NNS acts VBZ actuaries NNS act 
VB act VBP adapted VBD adapted VBN Adapted VBN adapting VBG adapt VB adapt VBP added VBD Added VBD added VBN Added VBN addicted VBN addicts NNS adding VBG Adding VBG additions NNS additives NNS addressed VBD addressed VBN addresses NNS addresses VBZ addressing VBG Addressing VBG address VB address VBP adds VBZ Adds VBZ add VB Add VB add VBP adepts NNS adhered VBD adhere VB adhesives NNS adjourned VBN adjudicators NNS adjusted VBD adjusted VBN adjusters NNS Adjusters NNS adjusting VBG adjustments NNS adjusts VBZ adjust VB Adjust VB adjust VBP admen NNS administered VBN administers VBZ administer VB administrations NNS administrators NNS admired VBD admired VBN Admirers NNS admires VBZ admissions NNS admits NNS admits VBZ admitted VBD ADMITTED VBD admitted VBN admitting VBG admit VB admit VBP admonishing VBG adolescents NNS adopted VBD ADOPTED VBD adopted VBN adopting VBG Adopting VBG adopts VBZ adopt VB adopt VBP adorned VBD adorned VBN adorn VB ADRs NNS ads NNS Ads NNS ADS NNS adults NNS Adults NNS advanced-ceramics NNS advanced VBD advanced VBN advancements NNS advancers NNS Advancers NNS advances NNS Advances NNS advance VB advance VBP advancing VBG Advancing VBG advantages NNS advantage VB adventures NNS adversaries NNS advertised VBD advertised VBN advertisements NNS advertisers NNS Advertisers NNS advertises VBZ advertise VB advertise VBP advertising VBG Advertising VBG advertising VBG|NN advised VBD advised VBN advisers NNS advises VBZ Advises VBZ advise VB advise VBP advising VBG advisories NNS advocated VBD advocated VBN advocates NNS Advocates NNS advocates VBZ advocate VB advocate VBP advocating VBG aerobics NNS affairs NNS affected JJ|VBN affected VBD affected VBN affecting VBG affections NNS affects VBZ affect VB affect VBP affidavits NNS affiliated VBN Affiliated VBN affiliates NNS affiliating VBG affinities NNS affirmed VBD affirming VBG afflicted VBN afflicts VBZ afflict VB afforded VBN afford VB afford VBP aftereffects NNS Aftereffects NNS after-hours NNS afternoons NNS aftershocks NNS Aftershocks NNS AFTERSHOCKS NNS aged VBN agencies NNS agendas NNS agents NNS Agents NNS ages NNS age VBP aggravated VBD aggravated VBN aggravates VBZ aggravate VB aggravate VBP aggravating VBG aggregates NNS aging VBG agitated VBN agonize VB agreed VBD Agreed VBD agreed VBN agreeing VBG agreements NNS agrees VBZ AGREES VBZ agree VB agree VBP agriproducts NNS Aichi NNS aided VBD aided VBN Aided VBN aides NNS Aides NNS aiding VBG aids NNS aids VBZ aid VB ailing VBG ailments NNS ails NNS aimed VBD aimed VBN Aimed VBN aiming VBG aims NNS aims VBZ Aims VBZ aim VB Aim VB aim VBP aircraft NNS aired VBD aired VBN airfields NNS airing VBG airlifted VBN airlifting VBG airliners NNS airlines NNS Airlines NNS airmen NNS airplanes NNS airports NNS airs NNS airs VBZ air VB air VBP airwaves NNS aisles NNS ai VBP ai VBZ alarmed VBN Alarmed VBN alarming VBG alarms NNS alarms VBZ Albanians NNS albums NNS alchemists NNS alcoholics NNS alerted VBD alerting VBG alerts VBZ alert VB alienated VBN alienates VBZ alienate VB alienating VBG aliens NNS aligned VBN align VBP allayed VBN allay VB allegations NNS alleged VBD alleged VBN alleges NNS alleges VBZ allege VB allege VBP alleging VBG allergies NNS alleviate VB alleviating VBG alleys NNS alliances NNS allied VBD allies NNS Allies NNS alligators NNS allocated VBD allocated VBN allocate VB allocate VBP allocating VBG allocations NNS allotments NNS allowances NNS allowed VB allowed VBD allowed VBN allowing VBG Allowing VBG allows VBZ allow VB Allow VB allow VBP 
alloys NNS allrightniks NNS alluded VBD allusions NNS allying VBG ally VB altered VBD altered VBN altering VBG alternates NNS alternates VBZ alternating VBG alternatives NNS alter VB Alter VB alter VBP aluminum-makers NNS alumni NNS amahs NNS amalgamate VB amalgamations NNS amassed VBD amassed VBN amasses VBZ amass VB amass VBP amateurs NNS amazed VBN amaze VB ambassadors NNS ambiguities NNS ambitions NNS amble VB ambushed VBD amended VBD amended VBN amending VBG Amending VBG amendments NNS amend VB amenities NNS Amenities NNS A-men NNS Americana NNS Americanized VBD Americans NNS Americans VBP amortize VB amounted VBD amounted VBN amounting VBG amounts NNS amounts VBZ amount VB amount VBP amphobiles NNS amplified VBN amplifiers NNS amplifying VBG amplify VB amps NNS amused VBN amusements NNS amuse VBP am VBP Am VBP AM VBP anachronisms NNS analyses NNS Analyses NNS analysts NNS Analysts NNS analyzed VBD analyzed VBN analyze VB analyze VBP analyzing VBG anchored VBN anchors NNS anchor VB anchor VBP and VBP anemias NNS anemics NNS angels NNS angered VBD angered VBN angering VBG angles NNS animals NNS Animals NNS animated VBN animosities NNS ankles NNS Anne VB anniversaries NNS announced VBD ANNOUNCED VBD announced VBN announcements NNS announces VBZ announce VB announce VBP announcing VBG annoyed VBD annoyed VBN annualized VBN Annualized VBN annuities NNS Annuities NNS ANNUITIES NNS Anointing VBG anomalies NNS answered VBD answered VBN answering VBG answers NNS Answers NNS answers VBZ answer VB answer VBP antagonists NNS antagonize VB anteaters NNS antecedents NNS antelope NNS anthers NNS anti-abortionists NNS antibodies NNS anticipated VBD anticipated VBN anticipates VBZ anticipate VB anticipate VBP anticipating VBG Anticipating VBG antics NNS anti-heroes NNS anti-infectives NNS antipathies NNS anti-programmers NNS antiquities NNS ants NNS anxieties NNS apartments NNS apologies NNS apologists NNS apologized VBD apologizes VBZ apologize VB apologizing VBG appalled VBN apparitions NNS appealed VBD appealed VBN appealing VBG Appealing VBG appeals NNS appeal VB appeal VBP appearances NNS appeared VBD appeared VBN appearing VBG appears NNS appears VBZ APPEARS VBZ appear VB appear VBP appeased VBD appease VB appendages NNS appended VBN append VB applauded VBD applauding VBG applauds VBZ applaud VB applaud VBP apples NNS appliances NNS applicants NNS applications NNS Applications NNS applied VBD applied VBN Applied VBN applies VBZ applying VBG Applying VBG apply VB apply VBP appointed VBD appointed VBN Appointed VBN appointees NNS appointments NNS appoint VB appraisals NNS appraised VBN appraisers NNS appraise VB appreciated VBD appreciated VBN appreciates VBZ appreciate VB appreciate VBP appreciating VBG apprehensions NNS apprised VBN approached VBD approached VBN approaches NNS approaches VBZ approaching VBG approach VB approach VBP appropriated VBD appropriated VBN appropriations NNS Appropriations NNS appropriators NNS approvals NNS approved VBD APPROVED VBD approved VBN approves VBZ approve VB approve VBP approving VBG approximates VBZ Arabs NNS arbitragers NNS Arbitragers NNS arbitrageurs NNS arbitraging VBG Arbitraging VBG arbitrates VBZ arbitrating VBG arborists NNS arbs NNS Arbs NNS arcades NNS arched VBD architects NNS Architects NNS arch VBP areas NNS Areas NNS arenas NNS are VBP Are VBP ARE VBP argued VBD argued VBN argues VBZ argue VB argue VBP arguing VBG Arguing VBG arguments NNS arisen VBN arises VBZ arise VB arise VBP ARISE VBP arising VBG Arkansas NNS armadillos NNS armed VBN 
Armed VBN armies NNS armpits NNS arms NNS Arms NNS arm VB aromas NNS arose VBD aroused VBD aroused VBN arouses VBZ arouse VB arousing VBG arpeggios NNS Arraignments NNS arranged VBD arranged VBN arrangements NNS Arrangements NNS arranges VBZ arrange VB arranging VBG arrears NNS arrested VBD arrested VBN Arrested VBN arrests NNS arrest VB arrivals NNS arrived VBD ARRIVED VBD arrived VBN arrives VBZ arrive VB arrive VBP arriving VBG arrows NNS arsenals NNS arteries NNS articles NNS articulate VB artifacts NNS artillerists NNS artists NNS Artists NNS arts NNS Arts NNS artworks NNS Asahi NNS ascending VBG ascertain VB ascribed VBN ascribe VBP ashes NNS Ashland VBP ashtrays NNS asked VBD Asked VBD asked VBN Asked VBN asking VBG asks VBZ ask VB Ask VB ask VBP aspects NNS aspens NNS aspersions NNS aspirations NNS aspired VBD aspires VBZ aspire VBP aspiring VBG assailed VBD assailed VBN assassinated VBD assassinated VBN assassinate VB assassinating VBG assassinations NNS assaults NNS assault VBP assemblages NNS assembled VBD assembled VBN assemble VB assemble VBP assemblies NNS assembling VBG asserted VBD asserted VBN asserting VBG assertions NNS asserts VBZ assert VB assert VBP asses NNS assessed VBD assessed VBN assessing VBG assessments NNS assess VB assess VBP assets NNS Assets NNS ASSETS NNS assigned VBN assignments NNS assigns VBZ assign VB assign VBP assimilate VB assistants NNS assisted VBN assisting VBG assists VBZ assist VB assist VBP associated VBN associates NNS Associates NNS associate VBP associating VBG associations NNS assuage VB assumed VBD assumed VBN assumes VBZ assume VB Assume VB assume VBP assuming VBG Assuming VBG assumptions NNS assurances NNS assured VBD assured VBN assures VBZ assure VB assuring VBG asteroids NNS astounds VBZ astronauts NNS ate VBD Ate VBD athletes NNS athletics NNS Atlantis NNS atolls NNS atoms NNS Atone VB atrocities NNS attached VBD attached VBN attaches VBZ attaching VBG attach VB attach VBP attacked VBD attacked VBN attackers NNS attacking VBG attacks NNS Attacks NNS attacks VBZ attack VB attack VBP attained VBN attain VB attarcks NNS attempted VBD attempted VBN attempting VBG attempts NNS Attempts NNS attempts VBZ attempt VB attempt VBP attendants NNS Attendants NNS attended VBD attended VBN attendees NNS attending VBG attends VBZ attend VB attend VBP Attention VB attests VBZ attest VB attics NNS attitudes NNS Attitudes NNS attorneys NNS Attorneys NNS attracted VBD attracted VBN Attracted VBN attracting VBG attractions NNS attracts VBZ attract VB attract VBP attributed VBD attributed VBN attributes NNS attributes VBZ attribute VB attribute VBP attributing VBG auctioned VBD auctioned VBN auctions NNS Auctions NNS auction VB audiences NNS audiocassettes NNS audiophiles NNS audited VBD audited VBN auditing VBG audition VB auditors NNS Auditors NNS audits NNS AUDITS NNS audit VB augment VB auspices NNS authored VBN authorities NNS Authorities NNS authorizations NNS authorized VBD authorized VBN authorizes VBZ authorize VB authorizing VBG authors NNS autions NNS auto-emissions NNS autographed VBN autographs NNS autograph VB auto\/homeowners NNS automakers NNS automated VBN Automated VBN automates VBZ automating VBG automobiles NNS Automobiles NNS auto-sales NNS autos NNS autumns NNS avenge VB avenues NNS averaged VBD averaged VBN averages NNS averages VBZ average VB average VBP averaging VBG averred VBD averted VBN averting VBG averts VBZ avert VB aviators NNS avoided VBD AVOIDED VBD avoided VBN avoiding VBG Avoiding VBG avoids VBZ avoid VB avoid VBP 
awaited VBD awaiting VBG awaits VBZ await VB await VBP awakened VBN awarded VBD awarded VBN awarding VBG awards NNS awards VBZ award VB awoke VBD axioms NNS axles NNS B-2s NNS Babelists NNS babies NNS Babies NNS backdated VBD back-dating VBG backed VBD BACKED VBD backed VBN backers NNS backfired VBD backfired VBN backfires VBZ backfire VB backfire VBP backflips VBZ backgrounds NNS backing VBG backlogs NNS backlots NNS backpackers NNS backpacks NNS backpedaling VBG backslapping VBG backs NNS backs VBZ Backs VBZ back-ups NNS back VB back VBP bacteria NNS badges NNS bags NNS bailed VBD Bailiffs NNS bailing VBG bailouts NNS bail VB bakeries NNS bakers NNS balanced VBN balance-of-payments NNS balances NNS BALANCES NNS balances VBZ balance VB balancing VBG balconies NNS bales NNS balked VBD balking VBG BALKS VBZ balk VB balk VBP ballerinas NNS ballets NNS ballooned VBD ballooned VBN ballooning VBG balloonists NNS balloons NNS balloons VBZ balloon VB ballots NNS BALLOTS NNS ballparks NNS ballplayers NNS balls NNS ballyhooed VBN bamboozled VBN bananas NNS bandages NNS banded VBN bandied VBN bands NNS band VB bangs VBZ bang VB banished VBN banish VB bankers NNS Bankers NNS BANKERS NNS banking VBG bankrolling VBG bankroll VB bankroll VBP bankruptcies NNS bankrupt VB bankrupt VBP banks NNS Banks NNS bank VB Bank VB bank VBP banned VBD banned VBN banners NNS banning VBG banshees NNS bans NNS bans VBZ ban VB ban VBP barbed VBN barbers NNS barbs NNS bargained VBD bargained VBN bargain-hunters NNS bargain-hunt VB bargaining VBG bargains NNS bargain VB barges NNS barges VBZ baring VBG barking VBG barnacles NNS barns NNS barons NNS barred VBD barred VBN Barred VBN barreling VBG barrels NNS Barrels NNS barricades NNS barriers NNS barring VBG Barring VBG bars NNS bars VBZ bartenders NNS bartered VBN bar VB Bar VB baseballs NNS based VBD based VBN Based VBN basements NNS bases NNS bases VBZ base VB base VBP bashing VBG Bashing VBG bash VB basics NNS basing VBG baskets NNS Baskets NNS bastions NNS batches NNS bathed VBN bathrooms NNS baths NNS bats NNS battalions NNS batted VBD batted VBN battered VBD battered VBN batteries NNS battering VBG batter VB batting VBG battled VBD BATTLED VBD battled VBN battlegroups NNS battlements NNS battles NNS battles VBZ battle VB battle VBP battling VBG bays NNS beaches NNS beads NNS beamed VBN beaming VBG beams VBZ beanballs NNS beans NNS bearings NNS bearing VBG bears NNS Bears NNS bears VBZ bear VB bear VBP beasties NNS beasts NNS beaten VBN beating VBG beats NNS beats VBZ beat VB beat VBD beat VBP became VBD becomes VBZ become VB Become VB BECOME VB become VBD become VBN become VBP becoming VBG bedeviled VBN bedevil VB bedfellows NNS Bedfellows NNS bedpans NNS bedrooms NNS beds NNS beefed VBD beefed VBN beefing VBG beef VB been VBN Been VBN been VBP beeping VBG beeps NNS beers NNS bees NNS befallen VBN befall VBP befell VBD befriended VBN befuddled VBD began VBD beggars NNS begged VBN begging VBG beginnings NNS beginning VBG Beginning VBG begins VBZ Begins VBZ begin VB begin VBP begot VBD begs VBZ begun VBN beg VB behaved VBD behaved VBN behaves VBZ behave VB behaving VBG behaviors NNS Beheading VBG behemoths NNS beings NNS being VBG Being VBG BEING VBG being VBG|JJ beleaguered VBN belfries NNS belied VBD beliefs NNS belie VB belie VBP believed VBD believed VBN believes VBZ believe VB believe VBP believing VBG belittle VB bellies NNS bellow VB bellringers NNS bells NNS bellwethers NNS belly-flopped VBD belonged VBD belongings NNS belonging VBG belongs VBZ belong VB belong 
VBP belting VBG belts NNS bemoaning VBG benches NNS benchmarks NNS bending VBG bend VB benefactors NNS beneficiaries NNS Beneficiaries NNS benefited VBD benefited VBN benefiting VBG benefits NNS BENEFITS NNS benefits VBZ benefit VB Benefit VB benefit VBP bequeathed VBD bequests NNS berated VBD berries NNS beset VBN besieged VBN bested VBD bested VBN bestirred VBN bestowed VBN betas NNS betrayed VBN bets NNS Bets NNS betters NNS better VB betting VBG bet VB bet VBD bet VBN bet VBP be VB Be VB BE VB be VBP beverages NNS beware VB Beware VB BEWARE VB bewildered VBN bewildering VBG bewitched VBN biased VBN biases NNS bibles NNS bickered VBN bickering VBG bicycles NNS bidders NNS bidding VBG bids NNS Bids NNS bids VBZ bid VB bid VBD bid VBN bid VBP bifurcate VB bikers NNS Bikers NNS bikes NNS Biking VBG bilges NNS bilking VBG billed VBD billed VBN billings NNS Billings NNS billing VBG billions NNS Billions NNS billowing VBG bills NNS Bills NNS BILLS NNS bills VBZ bill VB bill VBP binders NNS binding VBG binges NNS binoculars NNS bins NNS Bioengineers NNS biographers NNS biologists NNS biomedical-products NNS biopsies NNS birds NNS BIRDS NNS birthdays NNS births NNS biscuits NNS Bishops NNS bites NNS bites VBZ bite VB biting VBG bits NNS bitten VBN Bitten VBN blabs VBZ blacked VBN blackened VBN blacklist VB blackmailed VBN blackmailers NNS blackmailing VBG blackmail VB blackouts NNS blacks NNS Blacks NNS Blackstone VBP blades NNS blamed VBD blamed VBN Blamed VBN blames VBZ blame VB blame VBP blaming VBG Blaming VBG Blandings NNS blanketed VBD blankets NNS blanket VBP blared VBD blasted VBD blasting VBG blasts NNS blast VB blaze VBP blazing VBG bleachers NNS bled VBD bleeding VBG bleed VB blemishes NNS blending VBG blends NNS blend VB blessed VBN blessings NNS bless VB blew VBD blindfolded VBD blinds NNS blini NNS blinked VBD blinkers NNS blinks VBZ blink VB blips NNS blip VB blip VBP blitzes NNS blocked VBD blocked VBN Blocked VBN blocking VBG blocks NNS blocks VBZ block VB block VBP Blondes NNS bloodied VBN bloodletting VBG bloods NNS blooming VBG blossomed VBD blossomed VBN blossoms NNS blotting VBG blowing VBG blown VBN blows NNS blow VB bludgeoned VBN bludgeon VB bluebloods NNS blue-chips NNS blues NNS Blues NNS blundered VBD blunders NNS blunder VB blunted VBD blunted VBN blunt VB blurred VBD blurring VBG blurting VBG blurt VBP blur VB BMWs NNS boarding VBG boardrooms NNS Boardrooms NNS boards NNS board VB boasted VBD boasted VBN boasts VBZ boast VB boast VBP boaters NNS boating VBG boats NNS bodegas NNS bodes VBZ bode VB bodies NNS bodyworkers NNS Boeing VBG bogged VBD bogging VBG bog VB boiled VBD boilers NNS boiling VBG boils VBZ boil VB bolstered VBD bolstered VBN Bolstered VBN bolstering VBG Bolstering VBG bolsters VBZ bolster VB bolted VBN bolts NNS bombarded VBD bombarded VBN bombarding VBG bombed VBD bombed VBN bombers NNS bombings NNS bomblets NNS bombs NNS bomb VB bonded VBN bond-holders NNS bondholders NNS bondholdings NNS bonds NNS Bonds NNS BONDS NNS boned VBN bones NNS bonnets NNS bonuses NNS Bonuses NNS booed VBD booked VBD booked VBN bookers NNS bookings NNS Bookings NNS booking VBG booklets NNS books NNS Books NNS bookstores NNS book VB boomed VBD boomed VBN boomers NNS booming VBG booms NNS boom VB boosted VBD boosted VBN boosters NNS boosting VBG boosts NNS BOOSTS NNS boosts VBZ boost VB Boost VB boost VBP booths NNS Booths NNS bootlegged VBN boots NNS boozing VBG bordered VBN bordering VBG borders NNS bored VBN bore VBD boring VBG borne VBN born VBN Born VBN borrowed VBD 
borrowed VBN Borrowed VBN borrowers NNS Borrowers NNS borrowings NNS borrowing VBG borrowing VBG|NN borrows VBZ borrow VB borrow VBP bosses NNS Bosses NNS botched VBN bothered VBD bothered VBN bothering VBG bother VB bother VBP bottled VBN bottlenecks NNS bottlers NNS bottles NNS bottle VB bottling VBG bottomed VBD bottomed VBN bottoming VBG bottoms NNS bottom VB bought VBD bought VBN bounced VBD bounces NNS bounces VBZ bounce VB bounce VBP bouncing VBG boundaries NNS bounding VBG bounds NNS bounds VBZ bound VBN bourbons NNS bourses NNS boutiques NNS bouts NNS Bouygues NNS bowed VBD bowed VBN Bowing VBG bowling VBG bowls VBZ bowl VBP bow VB bow VBP boxes NNS boycotted VBN boycott VB boyfriends NNS boys NNS Boys NNS braced VBD braced VBN brace VB bracing VBG brags VBZ brag VB braids NNS brains NNS brakes NNS Brakes NNS braking VBG branched VBN branches NNS Branches NNS branching VBG branch VB brandished VBD brandishing VBG brands NNS Brands NNS brands VBZ brassieres NNS brats NNS braved VBD brave VB braving VBG Brawls NNS brazen VB Brazilians NNS breached VBD breached VBN breaches NNS breach VB breaded VBN breakdowns NNS breakers NNS breaking VBG Breaking VBG breaks NNS breaks VBZ breakthroughs NNS break VB break VBP breasts NNS breathed VBD breathe VB breathing VBG breaths NNS bred VBD bred VBN breeders NNS Breeders NNS breeding VBG breed VB breed VBP breezes NNS brethren NNS brewed VBN breweries NNS Breweries NNS brewers NNS brewing VBG brew VB bribed VBD bribed VBN bribes NNS bribe VB bribing VBG bricks NNS bridges NNS bridge VB bridging VBG briefcases NNS briefed VBD briefed VBN briefings NNS briefs NNS BRIEFS NNS brief VB brigades NNS brightened VBD brightened VBN brightening VBG brimmed VBD bringing VBG brings VBZ bring VB bring VBP bristled VBD bristles VBZ bristle VBP British NNS broadcasters NNS Broadcasters NNS broadcasting VBG Broadcasting VBG broadcasts NNS Broadcasts NNS broadcasts VBZ broadcast VB broadcast VBD broadcast VBN broadened VBD broadened VBN broadening VBG broadens VBZ broaden VB brochures NNS broken VBN brokerages NNS broker-dealers NNS brokered VBD brokering VBG brokers NNS Brokers NNS broke VBD Broncos NNS broncs NNS brothers NNS brought VBD brought VBN browbeat VB browse VB browsing VBG bruised VBN bruises NNS bruising VBG brushbacks NNS brushed VBD brushed VBN brushes NNS brushing VBG brush VB Brussels NNS bubbles NNS bubble VB Buccaneers NNS bucked VBD bucked VBN buckets NNS bucking VBG Bucking VBG buckled VBD buckle VB buckling VBG bucks NNS bucks VBZ buck VB buck VBP buddies NNS budding VBG budged VBD budged VBN budgeted VBN budgeteers NNS budgets NNS budge VB buds NNS buffer VB buffeted VBN buffets NNS Buffets NNS buffet VB buffing VBG buffs NNS bugged VBN bugs NNS Bugs NNS builders NNS Builders NNS building-materials NNS building-products NNS buildings NNS Buildings NNS building VBG Building VBG builds VBZ build VB build VBN build VBP built VBD built VBN Built VBN bulbs NNS bulging VBG bulkheads NNS bulldozed VBN bulldozers NNS bulletins NNS bullets NNS bullhorns NNS bullied VBD bullies VBZ bulls NNS Bulls NNS bullying VBG bumble VB bumble VBP bumbling VBG bumped VBD bumped VBN bumps NNS bump VB Bums NNS bunches NNS bundled VBN bundles NNS bundling VBG bungled VBN buns NNS buoyed VBD buoyed VBN Buoyed VBN buoying VBG buoys VBZ buoy VB burbles VBZ burdened VBD burdened VBN burdens NNS Burdens NNS burdens VBZ bureaucracies NNS bureaucrats NNS Bureaucrats NNS bureaus NNS burgeoning VBG burgers NNS burglaries NNS burglarized VBN burgs NNS burials NNS buried 
VBD buried VBN Buried VBN burned VBD burned VBN Burned VBN burning VBG burnishing VBG burnouts NNS burns NNS burns VBZ burnt VBN burn VB burn VBP bursting VBG bursts NNS bursts VBZ burst VBD burst VBP burying VBG bury VB bury VBP buses NNS bushels NNS bushes NNS busies NNS business-communications NNS businesses NNS Businesses NNS business-machines NNS businessmen NNS Businessmen NNS business-partners NNS busloads NNS busted VBD busted VBN busting VBG busts NNS butlers NNS butterflies NNS buttons NNS buttressed VBN buttresses VBZ buttress VB butt VB buy-backs NNS buy-back VB buyers NNS Buyers NNS BUYERS NNS buyings NNS buying VBG Buying VBG buy-outs NNS buyouts NNS buys NNS buys VBZ buy VB Buy VB buy VB|NN buy VBP buzzes VBZ buzzing VBG buzz VB buzzwords NNS bylaws NNS bylines NNS bypass VB bystanders NNS cabin-crew NNS cabinets NNS cables NNS cabs NNS caches NNS cadets NNS cadge VBP cafes NNS cafeterias NNS caked VBD calamities NNS Calaveras NNS calculated VBD calculated VBN Calculated VBN calculates VBZ calculate VB calculate VBP calculating VBG Calculating VBG calculations NNS calculators NNS calibrated VBN Californians NNS called VB called VBD Called VBD called VBN Called VBN CALLED VBN callers NNS Callers NNS calling VBG Calling VBG calls NNS Calls NNS calls VBZ call VB Call VB CALL VB call VBP calmed VBN calming VBG calm VB calories NNS Caltrans NNS calves NNS cameras NNS came VBD camouflaged VBN campaigned VBN campaigning VBG campaigns NNS campaign VB camped VBD campers NNS camps NNS campuses NNS Campuses NNS canals NNS canceled VBD canceled VBN canceled VBN|JJ canceling VBG cancellations NNS cancels VBZ cancel VB cancers NNS cancer-suppressors NNS candidates NNS candies NNS candles NNS canned VBN canning VBG cans NNS canvases NNS canvassed VBN canyons NNS capabilities NNS capacities NNS capacitors NNS capital-assets NNS capital-draining VBG capital-gains NNS capitalgains NNS capital-goods NNS capitalists NNS capitalized VBD capitalized VBN capitalize VB capitalizing VBG Capitalizing VBG capitals NNS capital-to-assets NNS capita NNS capitulated VBD capped VBD capped VBN capping VBG caps NNS capsules NNS captain VBP captioned VBD captivating VBG captives NNS captured VBD captured VBN captured VBN|JJ capture VB capturing VBG cap VB cap VBP carats NNS carbide-products NNS car-dealers NNS cardholders NNS cardinals NNS cards NNS cared VBD cared VBN careened VBD careening VBG careen VB careers NNS Careers NNS cares VBZ care VB care VBP caricatures NNS caricature VB carillons NNS caring VBG carnivores NNS carpenters NNS carpetbaggers NNS carpeted VBD carpets NNS carp VBP carried VBD carried VBN Carried VBN carriers NNS Carriers NNS carries VBZ carry-forwards NNS carryforwards NNS carrying VBG Carrying VBG carry VB carry VBP cars NNS Cars NNS carted VBD carting VBG Cartons NNS cartoonists NNS cartoons NNS cartridges NNS carts NNS cart VBP carved VBD carved VBN carvers NNS carves VBZ carve VB carve VBP carving VBG cascaded VBD cascading VBG caseloads NNS cases NNS Cases NNS cases VBZ cashed VBD cashed VBN cashing VBG cash VB casings NNS casinos NNS Casinos NNS caskets NNS cassettes NNS castigated VBN castigate VB castigating VBG castings NNS casting VBG castling VBG casts VBZ cast VB cast VBD cast VBN Cast VBN casualties NNS cataclysms NNS cataloging VBG catalogs NNS catapult VB catapult VBP Cataracts NNS catastrophes NNS catchers NNS catches VBZ catching VBG Catching VBG catch VB catch VBP categories NNS categorized VBN catered VBD catering VBG caters VBZ cater VB cater VBP CATFISH NNS 
catheters NNS cathodes NNS cats NNS cattle NNS Cattle NNS caught VBD caught VBN caused VBD caused VBN causes NNS causes VBZ cause VB cause VBP causing VBG cautioned VBD cautioning VBG cautions VBZ caution VB caution VBP caveats NNS caved VBD caves NNS C.D.s NNS CDs NNS ceased VBD ceased VBN ceases VBZ cease VB cease VBP ceded VBD ceded VBN cede VB ceding VBG ceilings NNS celebrated VBD celebrates VBZ celebrate VB celebrate VBP celebrating VBG celebrations NNS celebrities NNS cellars NNS cellists NNS cells NNS celluloids NNS cemented VBN Cementing VBG cement-makers NNS cement VB censored VBN censor VBP censured VBD centenarians NNS centered VBD centered VBN centering VBG centers NNS centers VBZ Centers VBZ center VBP centimeters NNS centralized VBN centralize VB cents NNS Cents NNS centuries NNS centurions NNS CEOs NNS ceramics NNS cereals NNS ceremonies NNS certificates NNS Certificates NNS CERTIFICATES NNS certified VBN certify VB CFCs NNS chafed VBN chafe VBP chains NNS Chains NNS chain VBP chaired VBD chaired VBN chairmen NNS chairs NNS chairs VBZ chalked VBN chalking VBG challenged VBD challenged VBN challengers NNS challenges NNS challenges VBZ Challenges VBZ challenge VB challenge VBP challenging VBG chambers NNS Chambers NNS Champagnes NNS championed VBD championed VBN championing VBG championships NNS champions NNS champion VBP champs NNS chances NNS chance VBP chandeliers NNS changed VBD CHANGED VBD changed VBN CHANGED VBN changes NNS Changes NNS changes VBZ change VB Change VB change VBP changing VBG Changing VBG channeled VBD channels NNS channel VB channel VBP Chans NNS chanted VBD chanted VBN chanting VBG chants NNS chaps NNS chapters NNS characteristics NNS characterized VBD characterized VBN characterizes VBZ characterize VB characterize VBP characterizing VBG characters NNS Characters NNS charged VBD charged VBN charge-offs NNS charges NNS Charges NNS charges VBZ charge VB Charge VB charge VBP charging VBG charities NNS Charities NNS charlatans NNS Charlestonians NNS charred VBN chartered VBD chartered VBN charts NNS charts VBZ chart VB chart VBP chased VBD chasers NNS chase VB chasing VBG chassis NNS chastened VBD chastened VBN chastised VBD chastised VBN chastises VBZ chatting VBG chat VB chauffeurs NNS chauffeur VB cheapens VBZ cheated VBD cheaters NNS cheating VBG cheat VB cheat VBP checkbooks NNS checked VBD checked VBN checking VBG checkpoints NNS checks NNS checks VBZ check VB Check VB check VBP cheered VBD cheered VBN cheering VBG cheerleaders NNS cheers NNS cheer VB cheeses NNS chefs NNS chelicerates NNS chemicals NNS Chemicals NNS chemical-weapons NNS chemists NNS cherished VBN cherishes VBZ cherries NNS cherubs NNS chewed VBD chewing VBG chews NNS chew VB chew VBP chickens NNS Chickens NNS chided VBD chided VBN chides VBZ chiefs NNS children NNS Children NNS CHILDREN NNS chilled VBN chilling VBG chill VB chimes VBZ chimneys NNS chimpanzees NNS Chinese NNS chipped VBN chipping VBG chips NNS chisel VB chlorofluorocarbons NNS choices NNS Choices NNS choked VBD choked VBN choke VB choking VBG chooses VBZ choose VB Choose VB choose VBP choosing VBG chopped VBN chopping VBG chops NNS chopsticks NNS chop VB chords NNS choreographers NNS chores NNS Chores NNS chortled VBD choruses NNS chosen VBN chose VBD Christians NNS chromosomes NNS Chronicles NNS chronicles VBZ chucked VBD chuckles NNS chuckles VBZ chuckling VBG chug VBP chums NNS chunks NNS churches NNS church-goers NNS churn VB churn VBP cials NNS cigarettes NNS cigars NNS cinch VB Cincinnati NNS circled VBD 
circles NNS circles VBZ circuits NNS circulars NNS circulated VBD circulated VBN circulate VB circulate VBP circulating VBG circulations NNS circumstances NNS circumventing VBG circumvents VBZ circumvent VB citations NNS cited VBD cited VBN Cited VBN cites VBZ cite VB cite VBP Citicorp VB cities NNS Cities NNS citing VBG Citing VBG citizens NNS Citizens NNS CITIZENS NNS civics NNS civilians NNS civil-rights NNS clad VBN Clad VBN claimants NNS CLAIMANTS NNS claimed VBD claimed VBN claiming VBG Claiming VBG claims NNS Claims NNS claims VBZ CLAIMS VBZ claim VB claim VBP clambered VBD clamored VBD clampdowns NNS clamped VBN clamping VBG clamp VB clanging VBG clanking VBG clarifications NNS clarified VBN clarifies VBZ clarifying VBG clarify VB clashed VBD clashed VBN clashes NNS clash VB classed VBN classes NNS Classes NNS classics NNS Classics NNS classifications NNS classified VBD classified VBN classifies VBZ classify VB classmates NNS classrooms NNS clauses NNS Claws NNS cleaned VBD cleaned VBN cleaners NNS clean-fuels NNS cleaning VBG Cleaning VBG cleansed VBD cleansed VBN cleansers NNS cleanse VB cleansing VBG cleans VBZ clean VB clearances NNS cleared VBD cleared VBN clearing VBG clears VBZ CLEARS VBZ clear VB clear VBP clergy NNS clerics NNS clerks NNS clicked VBD clientele NNS clients NNS Clients NNS climbed VBD climbed VBN climbers NNS climbing VBG climbs VBZ climb VB clinched VBD clinching VBG cling VB cling VBP clinical-products NNS clinics NNS clinkers NNS clipped VBD clipped VBN clippings NNS clips NNS clip VB cliques NNS cloak VBP clobbered VBD clobbered VBN clobber VB clocked VBN clocks NNS clocks VBZ clogged VBN clogging VBG cloned VBN clones NNS closed VBD closed VBN Closed VBN closed VBN|VBD closes NNS closes VBZ Closes VBZ close VB Close VB close VBP closings NNS closing VBG closing VBG|NN closures NNS clothed VBN clothes NNS clothiers NNS clouded VBN clouds NNS clouds VBZ cloud VB cloud VBP clowns NNS clubbed VBD CLUBBING VBG clubs NNS Clubs NNS CLUBS NNS clues NNS clumps NNS clustered VBN clusters NNS clutching VBG clutch VBP cluttered VBN clutter VB C'mon VB coaches NNS Coach VB co-anchored VBN coasted VBD coasters NNS coasts NNS coated VBN coatings NNS coats NNS Coats NNS coattails NNS co-authored VBN Co-authors NNS coaxing VBG coax VB cobbled VBD cobbled VBN Cobbs NNS co-chairmen NNS cockatoos NNS cockroaches NNS cocktails NNS coconuts NNS coddled VBN coded VBN co-defendants NNS CODE-NAMED VBN codes NNS code VB co-developers NNS codified VBN Codifying VBG co-edits VBZ coerces VBZ co-exist VB coextrude VBP coffers NNS co-founded VBD co-founders NNS cognoscenti NNS cohere VB cohorts NNS co-host VB coincided VBD coincides VBZ coincide VB coined VBN coins NNS colas NNS cold-cuts NNS coli NNS collaborated VBD collaborate VB collaborate VBP collaborating VBG collaborators NNS collages NNS collapsed VBD collapsed VBN collapses NNS collapses VBZ collapse VB collapsing VBG collars NNS collateralized VBN colleagues NNS Colleagues NNS collected VBD collected VBN collectibles NNS Collectibles NNS collecting VBG collections NNS collectives NNS collectivizers NNS collectors NNS Collectors NNS collects VBZ collect VB collect VBP colleges NNS Colleges NNS college-sports NNS colloquies NNS colonialists NNS colonies NNS colonists NNS color-coded VBN color-coding VBG colored VBN colors NNS color VB columnists NNS columns NNS co-managed VBN co-managing VBG combatants NNS combating VBG Combatting VBG combat VB combed VBN combinations NNS combined VBD combined VBN Combined VBN combines NNS 
combines VBZ combine VB combine VBP combing VBG combining VBG comedies NNS comestibles NNS comes VBZ Comes VBZ comets NNS come VB Come VB come VBD come VBN Come VBN come VBP comforted VBN comforting VBG comforts NNS coming VBG Coming VBG commanded VBN commanders NNS commanding VBG commandos NNS command VB command VBP commemorated VBD commemorate VB commemorate VBP commenced VBD commencing VBG commends VBZ commend VB commentaries NNS commentators NNS Commentators NNS commented VBD commenting VBG Commenting VBG comments NNS Comments NNS COMMENTS NNS comments VBZ comment VB commercialize VB commercializing VBG commercials NNS Commercials NNS commissioned VBD commissioned VBN commissioners NNS commissioning VBG Commissioning VBG commissions NNS Commissions NNS commissions VBZ commitments NNS commits VBZ committed VBD committed VBN committees NNS Committees NNS committees VBZ committes NNS committing VBG commit VB commit VBP commodities NNS Commodities NNS commoditize VB communicated VBD communicated VBN communicate VB communicating VBG communications NNS communiques NNS communists NNS Communists NNS communities NNS commuters NNS COMMUTERS NNS commutes NNS commuting VBG compacted VBN companies NNS Companies NNS COMPANIES NNS companions NNS Compaq VB compared VBD compared VBN Compared VBN compares VBZ compare VB Compare VB COMPARE VB compare VBP comparing VBG Comparing VBG comparisons NNS compatriots NNS compelled VBN Compelled VBN compels VBZ compel VB compensated VBN compensates VBZ compensate VB compensations NNS competed VBD competed VBN competes VBZ Competes VBZ compete VB compete VBP competing VBG Competing VBG competing VBG|JJ competitions NNS competitors NNS Competitors NNS compiled VBN Compiled VBN compiles VBZ compile VB compiling VBG complained VBD complained VBN complaining VBG complains VBZ complaints NNS Complaints NNS complain VB complain VBP complements VBZ complement VB completed VBD completed VBN completes VBZ complete VB completing VBG completions NNS complexes NNS complexities NNS complicated VBD complicated VBN complicates VBZ complicate VB complications NNS complied VBD complied VBN compliments NNS compliment VBP complying VBG Complying VBG comply VB components NNS composed VBN composers NNS composites NNS compositions NNS compounded VBD compounded VBN compounding VBG Compounding VBG compounds NNS compound VB compressed VBN compressors NNS comprised VBN comprises VBZ comprise VB comprise VBP comprising VBG compromised VBN compromises NNS Compromises NNS compromises VBZ compromise VB compromising VBG compulsions NNS Computations NNS computerized VBN computerize VB computerizing VBG computer-products NNS computer-services NNS computers NNS Computers NNS COMPUTERS NNS computer-systems NNS computes VBZ compute VB computing VBG comrades NNS concealed VBN concealing VBG conceal VB conceded VBD conceded VBN concedes VBZ concede VB concede VBP conceding VBG conceived VBD conceived VBN conceive VB conceiving VBG concentrated VBD concentrated VBN concentrates VBZ concentrate VB concentrate VBP concentrating VBG concentrations NNS conceptions NNS concepts NNS concerned VBD concerned VBN Concerned VBN concerning VBG Concerning VBG concerns NNS Concerns NNS concerns VBZ concern VB concertos NNS concerts NNS concessions NNS concluded VBD concluded VBN concludes VBZ conclude VB conclude VBP concluding VBG conclusions NNS concocted VBN concoctions NNS Concocts VBZ concurred VBD concur VB condemned VBD condemned VBN condemning VBG condemns VBZ condemn VB condensers NNS conditioned VBN 
conditioners NNS conditions NNS condominiums NNS condoms NNS condoned VBD condone VB condos NNS conducted VBD conducted VBN conducting VBG conducts VBZ conduct VB conduct VBP conduits NNS Conduits NNS cones NNS conferees NNS Conferees NNS conferences NNS conferred VBD conferring VBG confers VBZ confer VB confer VBP confessed VBD confessed VBN confesses VBZ confessing VBG confessions NNS confidants NNS confided VBD confides VBZ Confiding VBG configurations NNS confined VBN confines NNS confirmed VBD confirmed VBN confirming VBG Confirming VBG confirms VBZ confirm VB confirm VBP confiscated VBD confiscated VBN confiscate VB confiscating VBG conflicted VBN conflicting VBG conflicts NNS conflict VBP conforming VBG conforms VBZ conform VB conform VBP confrontations NNS CONFRONTATIONS NNS confronted VBN Confronted VBN confronting VBG confronts VBZ confront VB confront VBP confused VBD confused VBN confuses VBZ confuse VB confusing VBG confusions NNS conglomerates NNS congratulated VBD congratulated VBN congratulate VB congressmen NNS Congressmen NNS conjures VBZ conjure VBP connected VBN connecting VBG connections NNS connects VBZ connect VB connect VBP connotations NNS connote VB conquer VB conscripts NNS consented VBD consented VBN consenting VBG consents NNS consent VB consequences NNS conservationists NNS Conservationists NNS conservatives NNS Conservatives NNS CONSERVATIVES NNS conserve VB considerations NNS considered VBD considered VBN Considered VBN considering VBG Considering VBG considers VBZ consider VB Consider VB consider VBP consigned VBN consigns VBZ consisted VBD consisted VBN consisting VBG Consisting VBG consists VBZ consist VB consist VBP cons NNS consoles VBZ console VB consolidated VBD consolidated VBN consolidates VBZ consolidate VB consolidating VBG consolidations NNS consonants NNS consorting VBG conspiracies NNS conspirators NNS conspired VBD conspire VBP conspiring VBG constituencies NNS constituents NNS constituted VBD constitutes VBZ constitute VB constitute VBP constrained VBN constrains VBZ constraints NNS constrain VB constricting VBG constrictors NNS constructed VBN constructing VBG constructions NNS construct VB construed VBD construed VBN construe VB construe VBP consultants NNS Consultants NNS consultations NNS consulted VBN consulting VBG consult VB consumed VBD consumed VBN consumer-electronics NNS consumer-goods NNS consumer-products NNS consumers NNS Consumers NNS consume VB consume VBP consummated VBN contacted VBD contacted VBN contacting VBG contacts NNS contact VB contained VBD contained VBN containers NNS containing VBG contains VBZ contain VB contain VBP contaminated VBN cont'd. 
VBN contemplated VBD contemplated VBN contemplates VBZ contemplate VB contemplate VBP contemplating VBG contemporaries NNS contemporize VB contended VBD contended VBN contenders NNS contending VBG contends VBZ contend VB contend VBP contentions NNS contents NNS content VB contestants NNS contested VBD contested VBN contesting VBG contests NNS contest VB Continentals NNS contingencies NNS continued VBD continued VBN Continued VBN continues VBZ continue VB continue VBP continuing VBG Continuing VBG contraceptives NNS contract-drilling VBG contracted VBD contracted VBN contracting VBG Contracting VBG contractions NNS contractors NNS Contractors NNS contracts NNS Contracts NNS contracts VBZ contract VB contract VBP contradicting VBG contradictions NNS contradicts VBZ contradict VB Contras NNS contrasted VBD contrasted VBN contrasting VBG Contrasts NNS contrasts VBZ contrast VB contrast VBP contravened VBN contribued VBD contributed VBD contributed VBN contributes VBZ contribute VB contribute VBP contributing VBG Contributing VBG contributions NNS contributors NNS controlled VBD controlled VBN controllers NNS controlling VBG controls NNS controls VBZ control VB control VBP controversies NNS con VB convenants NNS convened VBD convened VBN convenes VBZ convene VB convene VBP convening VBG conventional-arms NNS conventioners NNS convention-goers NNS conventions NNS converged VBD conversations NNS conversions NNS converted VBD converted VBN converters NNS convertibles NNS converting VBG converts NNS converts VBZ convert VB convert VBP conveyed VBD conveys VBZ convey VB convey VBP convicted VBD convicted VBN convictions NNS CONVICTS VBZ convict VB convinced VBD convinced VBN convinced VBN|JJ convinces VBZ convince VB convince VBP convincing VBG convoluted VBN convolutions NNS convoys NNS convulsions NNS cookbooks NNS cooked VBN cookies NNS cooking VBG cooks NNS cook VB coolants NNS cooled VBD cooled VBN cooling VBG cools VBZ cool VB Cool VB cool VBP cooperated VBD cooperated VBN cooperate VB cooperate VBP cooperating VBG cooperatives NNS coordinated VBN coordinates VBZ coordinate VB coordinating VBG Coors NNS co-payments NNS cope VB copied VBD copied VBN copiers NNS copies NNS co-pilot NNS coping VBG co-presidents NNS co-produce VB copycats NNS copying VBG copyrighted VBN copyrights NNS copy VB copy VBP Copy VBP cores NNS corkscrews NNS cornered VBN corners NNS cornerstones NNS corner VB cornices NNS corporate-earnings NNS corporates NNS corporations NNS Corporations NNS corral VB corrected VBD corrected VBN correcting VBG corrections NNS corrects VBZ correct VB correct VBP correlate VBP corresponded VBD correspondents NNS Corresponding VBG correspond VB corridors NNS corroborate VBP Corvettes NNS cosmetics NNS Cosmetics NNS cosmologies NNS co-sponsored VBN co-sponsors NNS co-sponsor VB Costa NNS costing VBG costs NNS Costs NNS costs VBZ costumed VBN costumes NNS cost VB cost VBD cost VBN cost VBP cots NNS cottages NNS couched VBN couching VBG coughed VBD coughed VBN coughing VBG coughs NNS cough VB councilors NNS councils NNS counseled VBN counseling VBG counselors NNS counsels VBZ counsel VB counted VBD counted VBN countenance VB counteracted VBN counteract VB counterattack VB counterbalanced VBN counterbidders NNS counterbids NNS counter-claims NNS counterclaims NNS countered VBD Countered VBD countered VBN countering VBG countermeasures NNS counterparts NNS counterprogram VB counters NNS countersued VBD countersued VBN countersuing VBG countervailing VBG counter VB counter VBP counties NNS 
counting VBG Counting VBG countries NNS Countries NNS countrymen NNS counts NNS counts VBZ count VB count VBP Count VBP coupled VBN Coupled VBN couples NNS couplets NNS coup-makers NNS coupons NNS Coupons NNS coups NNS couriers NNS coursed VBN courses NNS courted VBD courted VBN courtesies NNS courthouses NNS courting VBG courtrooms NNS courts NNS Courts NNS COURTS NNS courts VBZ court VB cousins NNS covenants NNS coverages NNS covered VBD covered VBN coverings NNS covering VBG covers NNS covers VBZ coverts NNS cover VB cover VBP coveted VBN covets VBZ cowards NNS cowboys NNS Cowboys NNS cower VBP co-workers NNS cows NNS CPAs NNS crabs NNS cracked VBD cracked VBN cracking VBG Cracking VBG crackle VBP cracks NNS crack VB crack VBP crafted VBD crafted VBN crafting VBG craftsmen NNS craft VB crammed VBD cramming VBG cramps NNS crams VBZ cranes NNS craning VBG cranked VBD cranked VBN cranks NNS crank VB crashed VBD CRASHED VBD crashes NNS crashes VBZ crashing VBG Crashing VBG crash VB cratering VBG crates NNS crave VBP crawled VBD crawling VBG crawls VBZ crawl VB creak VB creamed VBN creams NNS created VBD created VBN Created VBN creates VBZ Creates VBZ create VB Create VB create VBP creating VBG creations NNS creators NNS Creators NNS creatures NNS credentials NNS credit-data NN|NNS credited VBD credited VBN crediting VBG creditors NNS Creditors NNS credit-ratings NNS credits NNS credits VBZ credit VB credit VBP creeping VBG crematoriums NNS crept VBD crept VBN crest VB crevasses NNS crevices NNS crews NNS cries VBZ crimes NNS criminalize VB criminals NNS crimping VBG crimp VB cringed VBD crippled VBN cripples NNS crippling VBG crises NNS Crises NNS crisscrossing VBG criss-cross VBP criteria NNS criticisms NNS criticized VBD criticized VBN criticizes VBZ criticize VB criticize VBP criticizing VBG critics NNS Critics NNS croak VBP croissants NNS cronies NNS crooks NNS crooned VBD croons VBZ cropped VBD cropped VBN cropping VBG crops NNS crop VB CROSS-BRED VBD crossed VBD crossed VBN crosses VBZ crossing VBG cross-pollinated VBN crossroads NNS cross-shareholdings NNS cross VB cross VBP crouched VBD Crouched VBN crowded VBD crowded VBN crowds NNS crowds VBZ crowd VBP crowed VBN crowned VBN crows VBZ CRs NNS crudes NNS cruisers NNS cruise VBP cruising VBG crumbled VBD crumbled VBN crumbles VBZ crumble VB crumbling VBG crumpled VBD crumpled VBN crunched VBD Crunch VB crushed VBN crushes VBZ crushing VBG crush VB crying VBG cryptographers NNS crystals NNS cry VB cry VBP cubs NNS cuckoos NNS cues NNS cuff VB culled VBN culminated VBD culminated VBN culminates VBZ culminating VBG culprits NNS cultivated VBN cultivates VBZ cultivating VBG cultures NNS cups NNS curators NNS curbed VBD curbed VBN curbing VBG CURBING VBG curbs NNS curb VB Curb VB cured VBN cures NNS cure VB curing VBG curled VBD curl VB currencies NNS currents NNS curry VB cursed VBD curses NNS curtailed VBD curtailed VBN curtailing VBG curtail VB curtail VBP curtains NNS cushioned VBN cushioning VBG cushion VB customers NNS Customers NNS customized VBN customs NNS Customs NNS cutbacks NNS cutouts NNS cuts NNS cuts VBZ cutters NNS cutting-tools NNS cutting VBG Cutting VBG cutting VBG|NN cut VB Cut VB cut VBD cut VBN cut VBP cuvees NNS CVB NNP cycads NNS Cycads NNS cycles NNS cyclicals NNS cycling VBG cyclists NNS c-Yields NNS czars NNS dabbled VBD dabble VB dabbling VBG dabs VBZ dailies NNS dalliances NNS damaged VBD damaged VBN damages NNS damages VBZ damage VB damage VBP damaging VBG damped VBN damped VBP dampened VBD dampen VB damping 
VBG damp VB damp VBP dams NNS dancers NNS dances NNS dance VB dancing VBG dangers NNS Dangers NNS dangled VBN dangling VBG dared VBD dare VB dare VBP darlings NNS dashed VBD dashed VBN dashes NNS dash VB databases NNS data NN|NNS data NNS Data NNS data NNS|NN dated VBN dates NNS dates VBZ date VB date VBP dating VBG daughters NNS daunted VBD daunting VBG dawdling VBG dawning VBG dawns VBZ days. NNS days NNS Days NNS dazzled VBN deactivates VBZ deadbeats NNS deadlines NNS deadlocked VBN dead VBN Deafening VBG dealerships NNS dealers NNS Dealers NNS dealings NNS dealing VBG Dealing VBG dealmakers NNS deals NNS deals VBZ dealt VBD dealt VBN deal VB deal VBP deaths NNS debacles NNS debated VBN debates NNS Debates NNS debate VB debating VBG debentures NNS debtholders NNS debtors NNS debts NNS debunk VB debuted VBD debut VB decades NNS Decades NNS decapitalize VBP deceased VBN deceived VBD deceived VBN deceive VB decelerated VBN decelerating VBG decentralized VBN decentralizing VBG decertified VBN decided VBD decided VBN decides VBZ decide VB Decide VB decide VBP deciding VBG Deciding VBG decimated VBN decision-makers NNS decisions NNS Decisions NNS decked VBN deckhands NNS decking VBG decks NNS declarations NNS declared VBD declared VBN declares VBZ declare VB declare VBP declaring VBG Declaring VBG declassifying VBG declined VBD declined VBN decliners NNS Decliners NNS declines NNS Declines NNS declines VBZ decline VB decline VBP declining VBG Declining VBG decontaminated VBN decorated VBN Decorated VBN decorators NNS decoys NNS decreased VBD decreased VBN decreases NNS decreases VBZ decrease VB decrease VBP decreasing VBG decreed VBN decribed VBD decried VBD decries VBZ decrying VBG Dec. VB dedicated VBD dedicated VBN deduces VBZ deducted VBN deductibles NNS deducting VBG deductions NNS Deductions NNS deduct VB deeds NNS deemed VBD deemed VBN de-emphasized VBN de-emphasize VB deems VBZ deem VBP deepened VBD deepening VBG deer NNS Deer NNS defaulted VBD defaulted VBN defaulters NNS defaulting VBG defaults NNS Defaults NNS default VB defeated VBD defeated VBN defeating VBG defeats NNS defeats VBZ defeat VB defected VBD defecting VBG defections NNS Defections NNS defects NNS defect VB defendants NNS Defendants NNS defended VBD defended VBN defenders NNS Defenders NNS defending VBG Defending VBG defends VBZ defend VB defend VBP defense-electronics NNS defenses NNS deferred VBN deferring VBG defer VB deficiencies NNS deficits NNS defied VBD defies VBZ defined VBD defined VBN defines VBZ define VB defining VBG Defining VBG definitions NNS deflated VBD deflated VBN deflate VB deflators NNS deflected VBD deflecting VBG deflect VB deformed VBN defrauded VBD defrauded VBN defrauding VBG defraud VB defunct VB defuse VB Defuse VB defying VBG defy VBP degenerated VBD degenerated VBN degenerate VB degrees NNS delayed VBD delayed VBN delaying NN|VBG delaying VBG delays NNS delays VBZ DELAYS VBZ delay VB delay VBP delegates NNS Delegates NNS delegate VB delegating VBG deleted VBN delete VB deleting VBG deletions NNS deliberate VB deliberating VBG deliberations NNS delighted VBD delighted VBN delights VBZ delight VB DELIGHT VBP deli NNS delinquencies NNS delinquents NNS delisted VBN delivered VBD delivered VBN deliveries NNS Deliveries NNS delivering VBG delivers VBZ deliver VB Deliver VB deliver VBP delousing VBG deluged VBD deluged VBN delved VBN delves VBZ demagogues NNS demanded VBD demanded VBN demanding VBG demands NNS demands VBZ demand VB demand VBP demeaned VBN demeanors NNS demilitarize VB 
demobilize VB demobilizing VBG democracies NNS democratized VBN democratize VB Democrats NNS demographics NNS Demographics NNS demolished VBD demolished VBN demolishing VBG demolish VB demonized VBN demons NNS demonstrated VBD demonstrated VBN demonstrates VBZ demonstrate VB demonstrate VBP demonstrating VBG demonstrations NNS Demonstrations NNS demonstrators NNS demoted VBN demurs VBZ denationalized VBN denials NNS denied VBD denied VBN Denied VBN denies VBZ denims NNS Denizens NNS denominated VBN denominations NNS denounced VBD denounced VBN denounce VB denounce VBP denouncing VBG dentists NNS dents NNS denuclearized VBN denude VB denying VBG deny VB deny VBP departed VBD departing VBG Departing VBG departments NNS departures NNS depart VB depart VBP depended VBD depended VBN dependents NNS depending VBG Depending VBG depends VBZ depend VB depend VBP depicted VBN depicting VBG Depicting VBG depicts VBZ depict VB depict VBP depleted VBD depleted VBN depletes VBZ deplete VB deplores VBZ deploring VBG deployed VBD deployed VBN deported VBD deposed VBN deposited VBD deposited VBN depositing VBG depositions NNS depositors NNS deposits NNS Deposits NNS deposits VBZ deposit VB depots NNS depreciated VBD depredations NNS depressed VBD depressed VBN depresses VBZ depressing VBG depressions NNS depress VB depress VBP deprivations NNS deprived VBD deprived VBN deprived VBN|JJ deprives VBZ deprive VB depriving VBG deprogrammings NNS depths NNS deputies NNS Deputies NNS derailed VBN derailing VBG derail VB deregulated VBN deregulate VB derided VBD derided VBN derivatives NNS derived VBD derived VBN derives VBZ derive VB deriving VBG Descendants NNS descended VBD descending VBG descends VBZ descents NNS described VBD described VBN describes VBZ describe VB describe VBP describing VBG Describing VBG descriptions NNS deserted VBN deserts NNS desert VB deserved VBD deserves VBZ deserve VB deserve VBP designated VBN designates VBZ designate VB designating VBG designations NNS designed VBD designed VBN designees NNS designers NNS designing VBG designs NNS Designs NNS designs VBZ design VB desired VBD desired VBN desires NNS desire VBP desist VB desks NNS despairs VBZ despised VBN despise VB despots NNS destabilize VB destabilizing VBG destinations NNS Destinations NNS destined VBN destroyed VBD destroyed VBN destroying VBG destroys VBZ destroy VB destroy VBP detached VBN Detached VBN detailed VBN detailing VBG details NNS Details NNS detained VBD detained VBN detaining VBG detected VBD detected VBN detecting VBG detectives NNS detectors NNS detect VB detect VBP detergents NNS deteriorated VBD deteriorated VBN deteriorates VBZ deteriorate VB deteriorate VBP deteriorating VBG determined VBD determined VBN determines VBZ determine VB determine VBP determining VBG Determining VBG deterred VBD deterrents NNS deterring VBG deters VBZ deter VB deter VBP detests VBZ dethroned VBN detractors NNS detracts VBZ detract VB devaluations NNS devalued VBD devalued VBN devastated VBD devastated VBN devastating VBG developed VBD developed VBN Developed VBN developers NNS Developers NNS developing VBG Developing VBG developments NNS Developments NNS develops VBZ develop VB Develop VB develop VBP deviated VBD deviations NNS devices NNS devils NNS devised VBD devised VBN devises VBZ devise VB devise VBP devoted VBD devoted VBN devotees NNS Devotees NNS devotes VBZ devote VB devote VBP devoured VBN devouring VBG dewatering VBG diabetics NNS diagnosed VBD diagnosed VBN diagnosing VBG diagnostics NNS diagramming VBG dialects NNS 
dialing VBG DIALING VBG dials NNS dial VB diamonds NNS diapers NNS diaries NNS dibenzofurans NNS dice NNS dickered VBD dictated VBD dictated VBN Dictates NNS dictates VBZ dictate VB dictate VBP dictatorships NNS dictators NNS did VBD Did VBD died VBD Died VBD DIED VBD died VBN Died VBN die-hards NNS Diehards NNS diesels NNS dies VBZ Dies VBZ die VB Die VB die VBP Die VBP differed VBD differences NNS Differences NNS differentials NNS differentiate VB differentiating VBG differing VBG differs VBZ differ VB differ VBP difficulties NNS digested VBN digesting VBG digest VB digging VBG digits NNS dignify VB dignitaries NNS digs NNS DIGS NNS digs VBZ dig VB diluted VBD diluted VBN diluted VBN|JJ dilute VB diluting VBG dimensions NNS dimes NNS diminished VBD diminished VBN diminishes VBZ diminishing VBG diminish VB diminish VBP dimming VBG dined VBD dined VBN diners NNS dining VBG dinners NNS dinosaurs NNS dioxins NNS diplomats NNS dipped VBD dipped VBN dipping VBG dips NNS dip VB Dip VB directed VBD directed VBN directing VBG directions NNS directives NNS directories NNS directors NNS Directors NNS directs VBZ direct VB Dirks NNS disabilities NNS disabled VBN disabled-workers NNS disabling VBG disadvantages NNS disagreed VBD disagreed VBN disagreements NNS disagrees VBZ disagree VB disagree VBP disallowed VBD disappeared VBD disappeared VBN disappears VBZ disappear VB disappear VBP disappointed VBD disappointed VBN disappointments NNS Disappointments NNS DISAPPOINTMENTS NNS disappoint VB disapproved VBD disapproved VBN disapproves VBZ disapprove VBP disarming VBG disarm VB disassemble VB disassociate VB disasters NNS Disasters NNS disavowed VBD disbanded VBN disbanding VBG disband VB disbursed VBN disbursements NNS discarded VBD discarded VBN discard VB discerns VBZ discern VB discharged VBN discharges NNS discharge VB disciples NNS disciplined VBD disciplined VBN disciplining VBG disclaims VBZ disclosed VBD disclosed VBN discloses VBZ disclose VB disclosing VBG disclosures NNS Disclosures NNS discolored VBN discomfit VB disconnected VBN disconnect VB discontinued VBN discontinue VB discontinuing VBG discos NNS Discos NNS discounted VBD discounted VBN Discounted VBN discounting VBG discounts NNS discounts VBZ discount VB discouraged VBD discouraged VBN discourages VBZ discourage VB discourage VBP discouraging VBG discovered VBD discovered VBN discoveries NNS discovering VBG discovers VBZ discover VB discover VBP discredited VBN discredit VB discrepancies NNS Discrepancies NNS discrepencies NNS discriminating VBG discs NNS discussed VBD discussed VBN discussing VBG Discussing VBG discussions NNS discuss VB discuss VBP disdaining VBG disdain VB diseases NNS disembark VBP disenchanted VBN disengage VB disgorge VB disgruntled VBN disguised VBN disguises NNS disguise VB disgusted VBN Disgusted VBN dishes NNS dish VB dishwashers NNS disinclined VBN disinfectants NNS disintegrated VBD disintegrating VBG disks NNS dislikes VBZ dislike VB dislike VBP dislocations NNS dismantled VBN dismantle VB Dismantle VB dismantling VBG dismayed VBN dismember VB dismissed VBD dismissed VBN dismisses VBZ dismissing VBG Dismissing VBG dismiss VB dismiss VBP disobey VB disorders NNS disparaged VBD disparage VB disparaging VBG disparities NNS dispatched VBD dispatched VBN dispatchers NNS dispatches NNS dispatching VBG dispatch VB dispelled VBD dispel VB dispensed VBD dispense VB dispense VBP dispensing VBG dispersants NNS dispersed VBD dispersing VBG displaced VBN displace VB displayed VBD displayed VBN displaying VBG 
displays NNS displays VBZ display VB display VBP displeases VBZ disposables NNS disposals NNS disposed VBD disposed VBN disposes VBZ dispose VB disposing VBG dispositions NNS disprove VB disputed VBD disputed VBN disputes NNS disputes VBZ dispute VB dispute VBP disqualified VBN disqualify VB disregarded VBD disregard VB disrupted VBD disrupted VBN disrupting VBG disruptions NNS disrupt VB dissatisfied VBN dissected VBN dissecting VBG disseminated VBN disseminate VB disseminating VBG dissented VBD dissented VBN dissenters NNS dissents NNS dissidents NNS Dissidents NNS dissipated VBN dissipates VBZ dissipate VB dissociate VB dissociating VBG dissolved VBN dissolves VBZ dissolve VB dissolving VBG dissuade VB distances NNS distance VB distancing VBG distilled VBN distillers NNS distilling VBG distinctions NNS distinguished VBD distinguished VBN distinguish VB distorted VBN distortions NNS distorts VBZ distort VB distort VBP distracted VBD distracted VBN distracting VBG distractions NNS distract VB distributed VBD distributed VBN Distributed VBN distributes VBZ distribute VB distribute VBP distributing VBG Distributing VBG distributions NNS distributors NNS districts NNS districts\/states NNS disturbances NNS disturbed VBN disturbing VBG disturbs VBZ disturb VB dithering VBG dived VBD diverge VB diverging VBG diversifed VBN diversifications NNS diversified VBN diversifying VBG diversify VB Diversify VB diversions NNS divers NNS diverted VBN diverting VBG divert VB divert VBP divested VBD divesting VBG Divesting VBG divestitures NNS divest VB divest VBP dives VBZ dive VB dive VBP divided VBD divided VBN dividends NNS divides VBZ divide VB Divide VB divide VBP dividing VBG dividing VBG|NN|JJ diving VBG divisions NNS divorced VBD divorced VBN divulge VB divvied VBN divvying VBG dizzying VBG dockets NNS dock-siders NNS doctors NNS Doctors NNS DOCTORS NNS doctor VB doctrines NNS docudramas NNS documentaries NNS documented VBN documenting VBG documents NNS Documents NNS documents VBZ document VB dodged VBD dodge VBP does VBZ Does VBZ dogged VBD dogged VBN dogging VBG do-gooders NNS dogs NNS Dogs NNS DOGS NNS dogs VBZ doing VBG Doing VBG doldrums NNS doled VBD dole VB dole VBP doling VBG dollars NNS dolls NNS dolphins NNS domes NNS dominated VBD dominated VBN dominates VBZ dominate VB dominate VBP dominating VBG donated VBD donated VBN donate VB donate VBP donating VBG Donating VBG donations NNS Donations NNS done VBN donned VBD Donning VBG donors NNS dons NNS dons VBZ DON'T VB don VB doomed VBD doomed VBN dooming VBG doomsayers NNS doom VB doormen NNS doors NNS doses NNS dossiers NNS doted VBN doth VBZ dotting VBG dot VBP double-crossed VBD doubled VBD Doubled VBD doubled VBN doubles VBZ double VB double VBP doubling VBG doubted VBD doubters NNS doubts NNS Doubts NNS doubts VBZ doubt VB doubt VBP do VB Do VB do VBP Do VBP dovetails VBZ dove VBD downed VBD downgraded VBD downgraded VBN Downgraded VBN downgrades NNS downgrading VBG downpayments NNS downplayed VBD downsized VBN downsize VB downsizing VBG downs NNS downturns NNS down VBP dozens NNS Dozens NNS drafted VBD drafted VBN drafting VBG draftsmen NNS draft VB dragged VBD dragged VBN dragging VBG Dragging VBG drags VBZ drag VB drag VBP drained VBN draining VBG drains VBZ drain VB dramatizations NNS DRAMs NNS drapes NNS drape VB drawbacks NNS drawings NNS drawing VBG Drawing VBG drawn VBN draws NNS draws VBZ draw VB draw VBP dreaded VBN dreamed VBD dreamed VBN dreaming VBG dreams NNS Dreams NNS dreams VBZ dreamt VBD dream VB Dream VB dream VBP 
dressed VBD dressed VBN dresses NNS dresses VBZ dressing VBG dress VB dress VBP drew VBD dried VBD dried VBN drifted VBD drifting VBG drift VB drift VBP drilled VBD drilled VBN drillers NNS drilling VBG drills NNS drill VB drinking VBG drinks NNS drink VB drink VBP dripping VBG driven VBN drivers NNS drives NNS drives VBZ drive VB drive VBP driving VBG Driving VBG drooled VBD drooling VBG droped VBD droplets NNS dropouts NNS dropped VBD dropped VBN droppers NNS dropping VBG drops NNS drops VBZ drop VB drop VBP droughts NNS droves NNS drove VBD drowned VBD drowned VBN drown VB drug-sales NNS drugs NNS Drugs NNS drugstores NNS drumming VBG drums NNS drum VB drying VBG dry VB Ds NNS dubbed VBD dubbed VBN Dubbed VBN dubs VBZ ducking VBG ducklings NNS ducks NNS Ducks NNS ducks VBZ duck VB ducts NNS duds NNS dueling VBG duels NNS due NNS dues NNS duffers NNS dug VBD dulled VBN dummies NNS dumped VBD dumped VBN dumping VBG dumps NNS dumps VBZ dump VB dump VBP dunes NNS dupes VBZ duplicated VBN duplicate VB Duplicating VBG duplications NNS durable-goods NNS durables NNS dusted VBD dusting VBG duties NNS 'd VBD dwarfed VBN dwarfs VBZ dwarf VB dwarf VBP dwellers NNS dwellings NNS dwindled VBD dwindling VBG dyed VBN dyes NNS dying VBG dynamics NNS dynamos NNS earmarked VBD earmarked VBN earmarking VBG earmark VB earned VBD earned VBN earners NNS earnigs NNS earnings NNS Earnings NNS EARNINGS NNS earning VBG earns VBZ Earns VBZ earn VB earn VBP earrings NNS ears NNS earthlings NNS earthquakes NNS earthworms NNS eased VBD eased VBN eases VBZ ease VB ease VBP easing VBG Easterners NNS East NNS EAST NNS eaten VBN eaters NNS eating VBG eats VBZ eat VB eat VBP eavesdrop VB ebbs VBZ ebb VB eccentrics NNS echelons NNS echoed VBD echoed VBN echoes NNS echoing VBG Echoing VBG echo VB echo VBP eclairs NNS eclipse VB eclipsing VBG economics NNS economies NNS economists NNS Economists NNS economize VB edged VBD edged VBN edges NNS edge VB edging VBG editions NNS editorials NNS Editorials NNS editors NNS edit VB educated VBN educate VB educating VBG educations NNS educators NNS Educators NNS effects NNS effects VBZ effect VB efficiencies NNS efforts NNS Efforts NNS eggs NNS egos NNS ejected VBN eked VBD eke VB elaborate VB elaborating VBG Elaborating VBG elapsed VBN elbows NNS elders NNS elected VBD elected VBN Elected VBN elections NNS Elections NNS ELECTIONS NNS electrical-products NNS electrified VBN electrochemicals NNS electrodes NNS electrogalvanized VBN electrogalvanizing VBG electromagnets NNS electronic-data NN|NNS electronics NNS electronic-systems NNS electro-optics NNS elect VB elect VBP elements NNS Elements NNS elephants NNS elevated VBD elevates VBZ elevations NNS elevators NNS eliminated VBD eliminated VBN eliminates VBZ eliminate VB Eliminate VB eliminate VBP eliminating VBG Eliminating VBG elite NNS elites NNS elitists NNS elongate VB eluded VBD eluding VBG emasculate VB embargoed VBD embargoes NNS embargos NNS embarked VBD embarked VBN embarking VBG embark VB embarrassed VBD embarrassed VBN embarrassing VBG embarrass VB embassies NNS embattled VBN embedded VBN Embedded VBN embellish VB embezzled VBD embezzling VBG emblems NNS embodied VBN embodies VBZ embody VBP emboldened VBN Emboldened VBN embraced VBD embraced VBN embraces VBZ embrace VB embracing VBG embroiled VBN emerged VBD emerged VBN emergencies NNS emerges VBZ emerge VB emerge VBP emerging VBG Emerging VBG emigrated VBD emigrate VB emigres NNS emissaries NNS emissions NNS emitted VBN emoted VBD emote VB emotions NNS empathize VB 
emphasized VBD emphasized VBN emphasizes VBZ emphasize VB emphasize VBP emphasizing VBG emphaticize VB empires NNS employed VBN employees NNS Employees NNS EMPLOYEES NNS employees VBZ employers NNS Employers NNS employing VBG employs VBZ employ VB employ VBP empowered VBN empowering VBG empowers VBZ empower VBP emptied VBN emptying VBG empty VB empty VBP emulated VBN emulate VB emulating VBG enabled VBD enabled VBN enables VBZ enable VB enable VBP enabling VBG enacted VBD enacted VBN enacting VBG enact VB encapsulate VB encasing VBG encircling VBG enclosed VBN enclosing VBG encompassed VBD encompasses VBZ encompass VB encountered VBD encountered VBN encounters NNS encounters VBZ encounter VB encouraged VBD encouraged VBN Encouraged VBN encourages VBZ encourage VB Encourage VB encourage VBP encouraging VBG Encouraging VBG encroaching VBG encrusted VBN encrypting VBG encumbered VBN endangered-species NNS endangered VBN endanger VB endeavoring VBG endeavors NNS endeavor VB ended VBD ENDED VBD ended VBN endings NNS ending VBG Ending VBG endorsed VBD endorsed VBN endorsements NNS endorsers NNS endorses VBZ endorse VB endorse VBP endorsing VBG endowed VBD endowed VBN endow VB ends NNS Ends NNS ends VBZ Ends VBZ end-tailed VBN endured VBD endured VBN endure VB endure VBP Endure VBP enduring VBG end VB End VB end VBP enemies NNS energies NNS energized VBN energy-services NNS enforced VBN enforcers NNS Enforcers NNS enforces VBZ enforce VB enforce VBP enforcing VBG engaged VBD engaged VBN engagements NNS engages VBZ engage VB engage VBP engaging VBG engineered VBN engineering VBG engineers NNS Engineers NNS engineer VB engines NNS English NNS engraved VBN engulfed VBD engulfed VBN enhanced VBD enhanced VBN enhancements NNS enhances VBZ enhance VB enhancing VBG enjoined VBD enjoined VBN enjoin VB enjoyed VBD enjoyed VBN enjoying VBG Enjoying VBG enjoys VBZ enjoy VB enjoy VBP enlarged VBN enlargers NNS enlarge VB enlarging VBG enlightened VBN enlightening VBG enlighten VB enlisted VBD enlisting VBG enlist VB enlivening VBG ennumerated VBD enraged VBD enriching VBG enrich VBP enrolled VBD enrolled VBN enrollees NNS enrollments NNS enroll VB enroll VBP ensconced VBN ensembles NNS ensnarled VBN ensued VBD ensue VB ensuing VBG ensures VBZ ensure VB ensure VBP ensuring VBG entailed VBN entails VBZ entail VB entangled VBN entered VBD entered VBN entering VBG enterprises NNS enters VBZ entertained VBD entertained VBN entertainers NNS entertaining VBG entertain VB enter VB Enter VB enter VBP enthusiasms NNS enthusiasts NNS Enthusiasts NNS enticed VBD entice VB entice VBP enticing VBG entities NNS entitled VBD entitled VBN entitlements NNS entitles VBZ entitle VB entitle VBP entitling VBG entombed VBN entranced VBN entrants NNS entrenched VBN entrench VB entrepreneurs NNS Entrepreneurs NNS entries NNS entrusted VBN entrust VB entrust VBP entwined VBN envelopes NNS environmentalists NNS Environmentalists NNS environments NNS envisaged VBD envisaged VBN envisioned VBN envisions VBZ envision VB envision VBP envy VBP eons NNS epileptics NNS episodes NNS epitomize VBP equaled VBD equaled VBN equaling VBG equals VBZ equal VB equal VBP equated VBN equates VBZ equate VB equestrians NNS equipped VBD equipped VBN Equipped VBN equipping VBG equips VBZ equip VB equities NNS Equities NNS equivalents NNS Equivalents NNS eradicate VB erased VBD erased VBN erases VBZ erase VB erasing VBG Erasing VBG erasures NNS erected VBD erected VBN erect VB eroded VBD eroded VBN erodes VBZ Erodes VBZ erode VB erode VBP eroding VBG errata 
NNS erred VBD erred VBN errors NNS errs VBZ err VB Err VB err VBP erupted VBD erupted VBN erupts VBZ erupt VB escalated VBD escalated VBN escalate VB escalating VBG escalators NNS escaped VBD escaped VBN escape VB escaping VBG eschewed VBN Escorts NNS escorts VBZ escrowed VBN espouse VBP ESPs NNS essays NNS essentials NNS established VBD established VBN Established VBN establishes VBZ establishing VBG Establishing VBG establishments NNS establish VB Establish VB establshed VBN estimated VBD estimated VBN Estimated VBN estimates NNS Estimates NNS estimates VBZ estimate VB estimate VBP estimating VBG Estimating VBG estimators NNS estranged VBN ethics NNS euphemisms NNS Eurobonds NNS Eurodebentures NNS EURODOLLARS NNPS|NNS EURODOLLARS NNS Euroissues NNS Euronotes NNS Europeans NNS evacuated VBN evacuate VB evaded VBN evaders NNS evades VBZ evade VB evaluated VBD evaluated VBN evaluates VBZ evaluate VB evaluate VBP evaluating VBG Evaluating VBG evaluations NNS Evaluations NNS evangelists NNS evaporated VBD evaporated VBN evaporate VB evened VBN evenings NNS evens VBZ events NNS Events NNS even VB Everglades NNS evidenced VBN evil-doers NNS evinced VBD evinced VBN eviscerating VBG evokes VBZ evoke VBP evoking VBG evolved VBD evolved VBN evolve VB evolving VBG exacerbated VBD exacerbated VBN exacerbates VBZ exacerbate VB exacerbating VBG exaggerated VBN exaggerate VB examinations NNS examined VBD examined VBN examiners NNS Examiners NNS examines VBZ examine VB EXAMINE VB examine VBP examining VBG examples NNS Examples NNS exams NNS excavated VBN excavating VBG excavators NNS exceeded VBD exceeded VBN exceeding VBG exceeds VBZ exceed VB exceed VBP excel VB excel VBP exceptions NNS except VB excerpts NNS Excerpts NNS excesses NNS exchanged VBD exchanged VBN exchanges NNS exchange VB exchange VBP exchanging VBG excised VBD excised VBN excise VB excited VBN excite VB exclaims VBZ excluded VBD excluded VBN Excluded VBN Excludes NNS excludes VBZ exclude VB exclude VBP excluding VBG Excluding VBG exclusions NNS excorciate VB excoriated VBN excursions NNS excused VBN excuses NNS excuse VB excutives NNS execs NNS executed VBD Executed VBD executed VBN executes VBZ execute VB execute VBP executing VBG executions NNS Executions NNS executives NNS Executives NNS EXECUTIVES NNS executors NNS exemplified VBN exemplifies VBZ ex-employees NNS exempted VBN exempting VBG exemptions NNS exempt VB exercised VBD exercised VBN exercises NNS exercises VBZ exercise VB exercise VBP exercising VBG exerpts NNS exerted VBN exerting VBG exert VB exhaled VBD exhausted VBD exhausted VBN exhausting VBG exhaust VB exhaust VBP exhibited VBN exhibiting VBG exhibitions NNS exhibitors NNS exhibits NNS exhibits VBZ exhibit VB exhort VB exiled VBD exiled VBN existed VBD existed VBN existing VBG Existing VBG exists VBZ exist VB exist VBP exited VBD exits NNS exits VBZ exit VB exonerated VBD exonerated VBN exonerating VBG exorcise VB exorcisms NNS expanded VBD expanded VBN expanding VBG expands VBZ EXPANDS VBZ expand VB expand VBP expansionists NNS expansions NNS expectations NNS Expectations NNS expected VB expected VBD expected VBN expecting VBG Expects NNS expects VBZ expect VB Expect VB expect VBP EXPECT VBP expedients NNS expedited VBN expedite VB expediting VBG expelled VBD expelled VBN expel VB expended VBN expenditures NNS expenditures VBZ expenses NNS Expenses NNS experienced VBD experienced VBN Experienced VBN experiences NNS experiences VBZ experience VB experience VBP experiencing VBG experimented VBD experimented VBN 
experimenting VBG experiments NNS Experiments NNS experts NNS Experts NNS expirations NNS expired VBD expired VBN expires VBZ expire VB expire VBP expiring VBG explained VBD explained VBN explaining VBG Explaining VBG explains VBZ Explains VBZ explain VB explain VBP explanations NNS exploded VBD exploded VBN explodes VBZ explode VB exploding VBG exploited VBN exploiters NNS exploiting VBG exploits NNS exploits VBZ exploit VB exploit VBP explores VBZ explore VB explore VBP exploring VBG explosions NNS Explosions NNS explosives NNS exported VBD exported VBN exporters NNS exporting VBG exports NNS Exports NNS exports VBZ export VB export VBP exposed VBD exposed VBN expose VB expose VBP exposing VBG exposures NNS expounding VBG expressed VBD expressed VBN expresses VBZ expressing VBG expressions NNS express VB express VBP expunged VBN expunge VB extended VBD extended VBN extending VBG extends VBZ extend VB extend VBP extensions NNS Extensions NNS Exteriors NNS extinguish VB extorted VBD extorting VBG extort VB extracted VBD extracted VBN extracting VBG extracts NNS extract VB extradited VBN extraditions NNS extrapolated VBN extras NNS extremes NNS extremists NNS extricate VB extrusions NNS exuded VBD exude VBP eyeballing VBG eyeballs NNS eyebrows NNS eyed VBD eyeglasses NNS eyeing VBG eyes NNS Eyes NNS eyewitnesses NNS eying VBG F16s NNS F-18s NNS F18s NNS fabricated VBN fabricate VB fabrications NNS fabricators NNS fabrics NNS facades NNS faced VBD faced VBN Faced VBN facelifts NNS faces NNS faces VBZ face VB face VBP facilitate VB facilitate VBP facilitating VBG facilities NNS facings NNS facing VBG FACING VBG facsimiles NNS factions NNS factories NNS Factories NNS factoring VBG factors NNS factors VBZ factor VB factory-jobs NNS facts NNS faded VBD faded VBN fades NNS fade VB fading VBG fads NNS failed VBD FAILED VBD failed VBN failings NNS failing VBG fails VBZ Fails VBZ failures NNS Failures NNS fail VB fail VBP fainting VBG faint VB fairs NNS fajitas NNS faked VBD faked VBN faking VBG fallen VBN falling VBG falls NNS falls VBZ fall VB fall VBP falsified VBN falsifying VBG falsify VB faltered VBD faltered VBN faltering VBG falters VBZ falter VBP famed VBN familiarize VB families NNS Families NNS famines NNS fanatics NNS fancies VBZ fangs NNS fanned VBD fans NNS Fans NNS fans VBZ fantasies NNS fantasize VB fantasize VBP fan VB fared VBD fared VBN fares NNS Fares NNS fares VBZ fare VB fare VBP Fare VBP farmers NNS Farmers NNS FARMERS NNS farming VBG farms NNS farmsteads NNS farms VBZ farm VB farmwives NNS fascinated VBN fascists NNS fashioned VBN fashions NNS fashion VB fastballs NNS fastened VBN fasteners NNS fatalities NNS Fatalities NNS fathers NNS Fathers NNS fats NNS fattened VBD fattened VBN fatten VBP faulted VBN faultlines NNS faults NNS fault VBP fauna NNS favored VBD favored VBN favoring VBG favorites NNS favors NNS favors VBZ favor VB favor VBP fawning VBG faxed VBD faxes NNS feared VBD feared VBN fearing VBG fears NNS Fears NNS fears VBZ fear VB fear VBP feasted VBN feasts NNS feathers NNS feats NNS featured VBD featured VBN features NNS features VBZ feature VB feature VBP featuring VBG fed VBD fed VBN feeding VBG feedlots NNS Feedlots NNS feeds VBZ feed VB feed VBP feelers NNS feelings NNS Feelings NNS feeling VBG Feeling VBG feels VBZ Feels VBZ feel VB feel VBP fees NNS Fees NNS feet NNS fellas NNS FELLED VBD felled VBN fellows NNS fell VBD fell VBN felonies NNS felons NNS felt VBD felt VBN females NNS feminists NNS fences NNS fended VBD fending VBG Fending VBG fend VB 
ferreting VBG ferret VB ferries NNS ferrying VBG ferry VB fertilized VBN fertilizers NNS fertilizing VBG fester VB festivals NNS festivities NNS festooned VBN festooning VBG fetched VBD fetches VBZ fetching VBG fetch VB fetch VBP fetuses NNS feuded VBD feuding VBG fiberglass NNS fibers NNS ficials NNS fidgeting VBG fiefdoms NNS fielded VBD fielded VBN fielding VBG fields NNS fields VBZ field VB fighter-bombers NNS fighters NNS fighting VBG fights NNS fights VBZ fight VB Fight VB fight VBP figured VBD figured VBN figures NNS Figures NNS figures VBZ figure VB figure VBP figuring VBG Figuring VBG filberts NNS filched VBN filed VBD filed VBN filers NNS files NNS files VBZ file VB file VBP filings NNS filing VBG Filipinos NNS filled VBD filled VBN filling VBG Filling VBG fills VBZ fill VB fill VBP filmed VBD filmed VBN Filmed VBN filming VBG film-makers NNS films NNS filtered VBN Filtered VBN filtering VBG filters NNS filters VBZ finagled VBN finalists NNS finalized VBD finalized VBN finalizing VBG finals NNS financed VBD financed VBN finances NNS FINANCES NNS finances VBZ finance VB financial-crimes NNS financial-services NNS financiers NNS financings NNS financing VBG findings NNS finding VBG Finding VBG finds NNS finds VBZ find VB find VBP Find VBP fine-arts NNS fined VBD fined VBN fines NNS finessed VBN fine-tuning VB fine VB fingered VBN fingering VBG fingerlings NNS fingerprints NNS fingers NNS finger VB fining VBG finished VB finished VBD finished VBN finishes NNS finishes VBZ finishing VBG finish VB finish VBP fireballs NNS fired VBD fired VBN firefighters NNS firehoops NNS firemen NNS fireplaces NNS fireproofing VBG fires NNS fires VBZ Fires VBZ fire VB fireworks NNS firings NNS firing VBG firmed VBD firmed VBN firming VBG firms NNS Firms NNS FIRMS NNS firm VB fisheries NNS fishermen NNS fishing VBG fissures NNS fists NNS fits NNS fits VBZ fit VB fit VBN fit VBP fixed VBD fixed VBN fixes NNS fixing VBG fixtures NNS fix VB fizzes VBZ fizzled VBD fizzled VBN flabbergasted VBN flags NNS Flags NNS flamed VBD flames NNS Flanked VBN flapping VBG flaps NNS flared VBN flare VBP flaring VBG flashbacks NNS flashed VBD flashed VBN flashes NNS flashes VBZ flashing VBG flashlights NNS flash VB flash VBP flats NNS flattened VBD flattened VBN flattening VBG flatten VB flaunts VBZ flaunt VB flavors NNS flawed VBN flaws NNS Flaws NNS flay VB fleas NNS fledging VBG fled VBD fled VBN fleeced VBN fleeing VBG fleets NNS fleets VBZ flee VB fleshpots NNS flew VBD flexing VBG flickered VBD flicking VBG flied VBD fliers NNS flies NNS flies VBZ flight-attendants NNS flights NNS Flights NNS flinch VB flinging VBG flings NNS flipped VBD flipping VBG flips VBZ flip VB flirted VBD flirted VBN flirting VBG floated VBD floated VBN floating VBG Floating VBG floats VBZ float VB float VBP flocked VBD flocked VBN flocking VBG flog VB flooded VBD flooded VBN flooding VBG flood VB floors NNS flopped VBD flopped VBN floppies NNS flora NNS flotations NNS floundered VBN floundering VBG flounder VB flourished VBD flourished VBN flourishing VBG flourish VB flouting VBG flowed VBD flowers NNS Flowers NNS flowing VBG flown VBN flows NNS flows VBZ flow VB flow VBP fluctuated VBD fluctuated VBN fluctuates VBZ fluctuate VB fluctuate VBP fluctuating VBG fluctuations NNS fluids NNS flunking VBG flunk VBP fluoropolymers NNS flush VB flush VBP flying VBG fly VB Fly VB fly VBP foaming VBG focused VBD focused VBN focuses VBZ focusing VBG Focusing VBG focus VB focus VBP foes NNS FOES NNS fog VB foiled VBD foiled VBN Foiled VBN foiling VBG 
foil VB folded VBD folded VBN folders NNS folding VBG fold VB fold VBP folks NNS Folks NNS follies NNS followed VBD followed VBN followers NNS following VBG Following VBG follows VBZ follow VB Follow VB follow VBP fomenting VBG food-fish NNS food-services NNS foods NNS foodstuffs NNS fooled VBN fooling VBG fools NNS fool VB foothills NNS Foothills NNS footing VBG footnoted VBN footnotes NNS footsteps NNS foot VB foot VBP forays NNS forbade VBD forbidden VBN forbidding VBG forbids VBZ forced VBD forced VBN forces NNS Forces NNS forces VBZ force VB force VBP FORCE VBP forcing VBG forecasters NNS forecasting VBG forecasts NNS Forecasts NNS forecasts VBZ forecast VB forecast VBD forecast VBN forecast VBP foreclosed VBD foreclosed VBN Foreclosed VBN foreclosed VBN|JJ foreclosures NNS Foreclosures NNS forefathers NNS foreigners NNS Foreigners NNS forensics NNS forerunners NNS foresaw VBD foreseen VBN foresees VBZ foresee VB foresee VBP foreshadowed VBN forest-products NNS Forest-products NNS forests NNS forfeitures NNS forfeit VB forged VBN forgeries NNS forgets VBZ forgetting VBG forget VB Forget VB forget VBP forge VB forgings NNS forging VBG forgiven VBN forgive VB forgiving VBG forgotten VBN forgot VBD forgot VBN forgo VB forked VBD forked VBN forklifts NNS fork VB formalities NNS formalizes VBZ formats NNS formed VBD formed VBN Formed VBN forming VBG forms NNS forms VBZ formulas NNS formulated VBN formulates VBZ formulate VB formulating VBG formulations NNS form VB form VBP forsaken VBN fortified VBN fortunes NNS forums NNS forward VB fossils NNS fostered VBD fostered VBN fostering VBG foster VB fought VBD fought VBN fouled VBN foundations NNS founded VBD founded VBN Founded VBN foundered VBD foundering VBG founders NNS Founders NNS founding VBG Founding VBG found VBD found VBN fountains NNS Four-fifths NNS foxes NNS fractioning VBG fractions NNS fractured VBD fractured VBN fragmented VBN fragments NNS fragments VBZ frailties NNS framed VBN framers NNS frames NNS frame VB framing VBG franchised VBN franchisees NNS Franchisees NNS franchisers NNS franchises NNS franchises VBZ franchise VB franchising VBG Franciscans NNS francs NNS fraternities NNS frauds NNS frayed VBN fray VB freaked VBN freaks NNS freedoms NNS freed VBD FREED VBD freed VBN Freed VBN freeholders NNS freeing VBG frees VBZ free VB free VBP freeways NNS freezers NNS freezes NNS freezes VBZ freeze VB freighters NNS freight VB French NNS frequencies NNS frequents VBZ freshmen NNS frets VBZ fretted VBD fretting VBG fret VB fret VBP frictions NNS Fridays NNS fried VBN friendships NNS friends NNS Friends NNS friers NNS friezes NNS frigates NNS frightened VBD frightened VBN frighten VB fringes NNS fripperies NNS frittered VBN frittering VBG frocks NNS frogmen NNS frogs NNS frolicked VBN frolic VB fronds NNS fronts NNS froth VB frozen VBN froze VBD fruits NNS frustrated VBD frustrated VBN frustrate VB frustrating VBG frustrations NNS frying VBG fudge VB fudge VBP fueled VBD fueled VBN fueling VBG Fueling VBG fuel-services NNS fuels NNS fuel VB fugitives NNS Fuji NNS fulfilled VBD fulfilled VBN fulfilling VBG fulfills VBZ fulfill VB fulfill VBP fulminations NNS fumes NNS fumes VBZ fuming VBG fumpered VBD functionaries NNS functioned VBD functioning VBG functions NNS function VB function VBP fundamentalists NNS fundamentals NNS funded VBD funded VBN Funded VBN funding VBG fund-raisers NNS fundraisers NNS Fund-Raisers NNS fundraising VBG funds NNS Funds NNS FUNDS NNS funds VBZ fund VB fund VBP fungi NNS funneled VBD funneled VBN 
funneling VBG funnel VB furloughed VBN furloughs NNS furnaces NNS furnished VBN furnishings NNS furnishing VBG furnish VB furriers NNS furrows VBZ furs NNS furthering VBG furthers VBZ further VB fusses VBZ futures NNS Futures NNS FUTURES NNS gadgets NNS gagged VBN gained VB gained VBD gained VBN gainers NNS Gainers NNS gaining VBG gains NNS Gains NNS gains VBZ gain VB gain VBP galaxies NNS galleries NNS gallons NNS galloping VBG gallstones NNS galvanized VBD galvanize VB galvanizing VBG gamblers NNS gamble VB gambling VBG games NNS gangbusters NNS gangs NNS gangsters NNS gaped VBN garages NNS gardeners NNS gardenettes NNS gardening VBG gardens NNS garden VB garments NNS garnered VBD garnered VBN garner VB garner VBP gases NNS Gases NNS gas-gathering VBG gasolines NNS gasped VBD gasp VB gates NNS gathered VBD gathered VBN Gathered VBN gatherings NNS gathering VBG gathers VBZ gather VB gather VBP gauges VBZ gauge VB gauging VBG gave VBD Gave VBD gaze VBP geared VBN gearing VBG gears VBZ gear VB gear VBP geeks NNS Geeks NNS gemsbok NNS gems NNS gender VB generalists NNS generalizations NNS Generalizations NNS generalize VB generated VBD generated VBN generates VBZ generate VB generate VBP generating VBG generations NNS generators NNS genes NNS genres NNS gentleladies NNS gentlemen NNS geosciences NNS Germans NNS GERMANS NNS germs NNS gestured VBD gestures NNS gets VBZ Gets VBZ getting VBG Getting VBG get-togethers NNS get VB Get VB GET VB get VBP Get VBP geysers NNS ghettos NNS ghostbusters NNS Ghostbusters NNS ghosts NNS giants NNS Giants NNS gifts NNS gilts NNS Gilts NNS gimmicks NNS girded VBD girding VBG girls NNS giveaways NNS Giveaways NNS givebacks NNS given VBN Given VBN gives VBZ Gives VBZ giveth VBZ give VB Give VB give VBP GIVE VBP giving VBG Giving VBG gizmos NNS glamorized VBN glamorize VB glanced VBD glares VBZ glasses NNS glaze VB glaze VBP gleaming VBG gleaned VBN glean VB glide VB gliding VBG glimpses NNS glitches NNS glitterati NNS gloated VBD gloaters NNS gloating VBG gloats VBZ gloat VB globalists NNS gloss VB gloss VBP gloves NNS glowed VBD glowing VBG glued VBN glues NNS gluts NNS glutted VBN glut VB glycols NNS gnaw VB goals NNS goats NNS gobbled VBN gobbling VBG goblins NNS Gods NNS goes VBZ Goes VBZ goings-on NNS going VBG Going VBG goldbanded VBN golds NNS golfers NNS golfs NNS Goliaths NNS gone VBN Gone VBN gone VBN|JJ gon VB gon VBG goodies NNS goods NNS Goodyear VBP gored VBN gore VB gorillas NNS gossiping VBG gotten VBN got VB got VBD Got VBD got VBN got VBP go VB Go VB go VBP governed VBD governed VBN governing VBG governmental-affairs NNS government-relations NNS government-securities NNS government-set VBN governmentset VBN governments NNS Governments NNS governors NNS Governors NNS govern VB Govern VB govern VBP grabbed VBD grabbed VBN grabbing VBG grabs NNS grab VB grab VBP grace VB graders NNS grades NNS Grads NNS graduated VBD graduated VBN graduates NNS Graduates NNS graduates VBZ grafted VBN grains NNS Grains NNS GRAINS NNS Grammys NNS grams NNS grandchildren NNS grandees NNS grandkids NNS grandmasters NNS grandmothers NNS grandparents NNS Granges NNS granted VBD granted VBN granting VBG grants NNS grants VBZ grant VB grant VBP grapes NNS Grapes NNS graphics NNS Graphics NNS graphs NNS grappled VBD grapples VBZ grapple VB grasping VBG grasp VB grasp VBP grassroots NNS gratuities NNS graying VBG grazed VBD grazers NNS graze VBP great-grandchildren NNS greats NNS greenhouses NNS greens NNS Greens NNS greeted VBD greeted VBN Greetings NNS greeting VBG 
greets VBZ greet VB grenades NNS grew VBD GREW VBD grew VBN gridlocked VBN grievances NNS grill VBP grimaced VBD grimaces NNS grimace VB grinders NNS grinding VBG grinds VBZ grind VB gringos NNS Grinned VBD grinning VBG grins NNS gripes NNS gripes VBZ gripped VBD gripping VBG grips NNS groans VBZ groceries NNS groped VBD grossing VBG grottoes NNS groundbreakers NNS grounded VBN ground-handling NNS grounding VBG grounds NNS ground VB ground VBD ground VBN grouped VBN groups NNS Groups NNS group VB groused VBD Groused VBD grouses VBZ grovels VBZ growers NNS growing VBG Growing VBG GROWING VBG growls VBZ grown VBN grows VBZ Grows VBZ growths NNS growth VB grow VB grow VBP grueling VBG grumbled VBD grumble VBP guaranteed VBD guaranteed VBN Guaranteed VBN guaranteeing VBG guarantees NNS guarantees VBZ guarantee VB guarantee VBP guarded VBD guarded VBN guarding VBG guards NNS guards VBZ guard VB guard VBP Guber-Peters NNS guerrillas NNS guessed VBD guessing VBG guess VB guess VBP guests NNS Guests NNS guided VBD guided VBN guidelines NNS Guidelines NNS guideposts NNS guides NNS guide VB guiding VBG guilders NNS gunboats NNS gunmen NNS Gunmen NNS gunned VBN gunners NNS gunslinging VBG guns NNS Guns NNS gurus NNS Gurus NNS gushes VBZ gush VBP guts NNS gut VB guys NNS Guys NNS guzzle VB gymnastics NNS gyrated VBD gyrate VB gyrating VBG gyrations NNS habeas NNS habitats NNS habits NNS hackers NNS hackles NNS hacks NNS hack VB had VBD Had VBD had VBN haggle VB hagglings NNS haggling VBG hailed VBD hailed VBN hailing VBG hails VBZ half-states NNS halls NNS hallways NNS halogenated VBD halted VBD halted VBN halting VBG halts NNS halts VBZ halt VB halt VBP halved VBD halved VBN halves NNS halves VBZ halve VB hamburgers NNS hammered VBN hammering VBG hammer VB hamming VBG hampered VBD hampered VBN hampering VBG hampers VBZ hamper VB hamstring VB hamstrung VBN hamstrung VBP handbills NNS handbooks NNS hand-carried VBN handcuffed VBN handcuffs NNS handed VBD handed VBN handicapped NNS handicapped VBN handicap VB handled VBD handled VBN handlers NNS handles VBZ handle VB handle VBP handling VBG handpicked VBN hands NNS handstands NNS hands VBZ hand VB hanged VBN hanging VBG hangs VBZ hang VB hang VBP happened VBD Happened VBD happened VBN Happened VBN happenings NNS happening VBG happens VBZ happen VB happen VBP harangues NNS harangues VBZ harassed VBD harassing VBG harass VB harboring VBG harbors NNS harbors VBZ harbor VBP hardened VBN hardships NNS harmed VBD harmed VBN harms NNS harms VBZ harm VB harm VBP harnessing VBG harped VBD harping VBG harp VB harried VBN harvested VBN harvests NNS harvest VBP hashing VBG hassles NNS hastened VBN hasten VB has VBN has VBP has VBZ Has VBZ HAS VBZ hatched VBN hatch VB hated VBN hates VBZ hate VB hate VBP hats NNS hauled VBD haulers NNS hauling VBG haul VB haunted VBN haunting VBG haunts NNS haunts VBZ haunt VB haunt VBP havens NNS have VB Have VB have VBD have VBN have VBP Have VBP having VBG Having VBG Hawaii NNS hawkers NNS hawking VBG hawks NNS hawk VBP hazards NNS HCFCs NNS HDTVs NNS headaches NNS headed VBD headed VBN Headed VBN heading VBG Heading VBG headlights NNS headlined VBD headlined VBN headlines NNS headphones NNS headquarters NNS headrests NNS headsets NNS heads NNS heads VBZ head VB head VBP healed VBN healing VBG health-products NNS heal VB heaped VBD heaped VBN heaping VBG heard VBD heard VBN Heard VBN hearings NNS Hearings NNS hearing VBG Hearing VBG hears VBZ HEARS VBZ heartened VBN hearts NNS hear VB hear VBP heated VBN heaters NNS heating VBG 
Heating VBG heats VBZ heat VB heaved VBD heaved VBN heavens NNS heaves VBD heavyweights NNS heckled VBN hedgers NNS hedges NNS hedge VB hedge VBP hedging VBG hedging VBG|JJ heebie-jeebies NNS heeded VBD heeded VBN heed VB heels NNS heighborhoods NNS heightened VBD heightened VBN heighten VB heights NNS heirs NNS held VBD held VBN helicopters NNS helped VBD helped VBN Helped VBN helped VBP helping VBG Helping VBG helps VBZ Helps VBZ help VB Help VB help VBP hemorrhaged VBN hemorrhaging VBG hemorrhoids NNS hens NNS Hens NNS heralded VBN herald VB herald VBP herbicides NNS Hercules NNS herding VBG herds NNS herniated VBN heroes NNS herons NNS hesitate VB hesitate VBP hesitating VBG hewed VBD hewn VBN hews VBZ hidden VBN hideouts NNS hiders NNS hides NNS hide VB hiding VBG hid VBD highlands NNS highlighted VBD highlighted VBN highlighting VBG highlights NNS Highlights NNS highlights VBZ highlight VB high-rises NNS highs NNS hightailing VBG hightops NNS highways NNS Highways NNS hiked VBN hikers NNS hikes NNS hills NNS hindered VBD hindered VBN hindering VBG hinders VBZ hinder VB hinge VB hinted VBD hinted VBN hinterlands NNS hinting VBG hints NNS hints VBZ hint VB hint VBP hips NNS hired VBD hired VBN Hired VBN hires NNS hires VBZ hire VB hire VBP hiring VBG Hispanics NNS hissed VBD historians NNS historical-claims NNS historicized VBN hitched VBN hitches NNS hits NNS hits VBZ hitters NNS hitting VBG hit VB hit VBD hit VBN Hit VBN hit VBP Hit VBP hoarding VBG hoards NNS hoard VBP hobbies NNS hobbled VBN hobbles VBZ hobbling VBG hobbyists NNS hobos NNS Hoe VB hog NNS hogs NNS Hogs NNS hoisted VBN holders NNS Holders NNS holdings NNS Holdings NNS holding VBG Holding VBG holdouts NNS holdovers NNS holds VBZ holdups NNS hold VB Hold VB HOLD VB hold VB|NN hold VBP Hold VBP holed VBN holes NNS hole VBP holidays NNS holler VB HomeFed VBN homeowners NNS homered VBD homers NNS homer VB homes NNS homicides NNS homosexuals NNS Homosexuals NNS Hondurans NNS Honduras NNS honed VBN hone VB honorariums NNS honored VBN honoring VBG honors NNS honor VB honor VBP hoods NNS hoodwinked VBN hooked VBD hooked VBN hooking VBG hooks VBZ hookups NNS hook VB hooves NNS hoped VBD hoped VBN hopes NNS Hopes NNS HOPES NNS hopes VBZ hope VB hope VBP hoping VBG Hoping VBG hopping VBG hopscotched VBD hops VBZ horizons NNS hormones NNS horns NNS horoscopes NNS horribles NNS horrors NNS horses NNS Horses NNS horticultural-products NNS hosannas NNS hoses NNS Hoses NNS hoses VBZ hospitalizations NNS hospitalized VBN hospitals NNS Hospitals NNS hostages NNS hosted VBD hostilities NNS hosting VBG hosts NNS hosts VBZ host VB hot-cereals NNS hotel-casinos NNS hoteliers NNS hotels NNS hotlines NNS hounded VBD hounding VBG hours NNS Hours NNS housed VBN households NNS houses NNS houses VBZ house VB house VBP housewares NNS housewives NNS Housings NNS hovered VBD hovered VBN hovering VBG howling VBG huckstering VBG huddled VBD hugged VBD hugging VBG hugs NNS hulking VBG humanities NNS humanizing VBG human-resources NNS human-rights NNS humans NNS humbled VBN hum VB hunched VBN hundreds NNS Hundreds NNS hung VBD hung VBN hunker VB hunted VBN hunter-gatherers NNS hunters NNS hunting VBG hunts VBZ hunt VB hunt VBP hurdles NNS hurled VBN hurling VBG hurl VBP hurricanes NNS hurried VBN hurries VBZ hurry VB hurting VBG hurtling VBG hurts VBZ Hurts VBZ hurt VB hurt VBD hurt VBN hurt VBP husbands NNS HUSBANDS NNS hustlers NNS hustles VBZ hybrids NNS hyenas NNS hyped VBD hypermarkets NNS hyping VBG hypnotized VBN hypocrites NNS hypothesized VBN 
ice-baggers NNS ideals NNS ideas NNS Ideas NNS identified VBD identified VBN identifies VBZ identifying VBG identify VB identify VBP identities NNS ideologies NNS ideologues NNS Ideologues NNS idiots NNS idled VBD idled VBN idle VB idling VBG ignited VBD ignited VBN ignite VB ignored VBD ignored VBN ignores VBZ ignore VB Ignore VB ignore VBP ignoring VBG Ignoring VBG illegalities NNS illnesses NNS ills NNS illuminates VBZ illuminate VB illusions NNS illustrated VBD illustrated VBN illustrates VBZ illustrate VB illustrate VBP illustrations NNS images NNS imagined VBD imagined VBN imagines VBZ imagine VB Imagine VB imagine VBP imagining VBG imbalances NNS imitated VBN imitate VBP imitating VBG immersed VBN immigrants NNS immigrated VBD immunities NNS impacted VBN impacts NNS impact VB impaired VBN impair VB impart VB impeached VBN impeded VBN impedes VBZ impede VB impediments NNS impeding VBG impelled VBN impending VBG imperatives NNS imperfections NNS imperialists NNS imperiled VBN impersonations NNS implanted VBD implanted VBN implanting VBG implant VB implemented VBD implemented VBN implementing VBG implements VBZ implement VB implicated VBN implicate VB implications NNS implied VBD implied VBN implies VBZ implores VBZ imploring VBG implying VBG imply VB imply VBP imported VBD imported VBN imported VBN|JJ importers NNS importing VBG imports NNS Imports NNS imports VBZ import VB import VBP imposed VBD imposed VBN imposes VBZ impose VB Impose VB imposing VBG impounded VBN impound VB impoverished VBN impressed VBD impressed VBN impresses VBZ impressionists NNS impress VB imprisoned VBN Imprisoned VBN imprisoning VBG imprison VB improprieties NNS improved VBD improved VBN improvements NNS improves VBZ improve VB improve VBP improving VBG Improving VBG improvised VBD impugn VB impulses NNS inaugurated VBN incarcerate VB incensed VBN incentives NNS inched VBD inched VBN inches NNS inching VBG inch VB incidents NNS incisions NNS inciting VBG inclined VBN included VBD included VBN Included VBN includes VBZ Includes VBZ include VB include VBP including VBG Including VBG incomes NNS incongruities NNS inconsistencies NNS incorporated VBD incorporated VBN incorporates VBZ incorporate VB incorporating VBG increased VB increased VBD increased VBN Increased VBN increased VBN|JJ increases NNS Increases NNS increases VBZ increase VB Increase VB increase VBP increasing VBG Increasing VBG increments NNS incriminating VBG incumbents NNS incurred VBD incurred VBN incurring VBG incur VB incur VBP indemnify VB independents NNS indexed VBN indexers NNS indexes NNS Indexes NNS index-futures NNS indexing VBG index-options NNS indicated VBD indicated VBN indicates VBZ indicate VB indicate VBP indicating VBG indications NNS indicators NNS indices NNS indicted VBD indicted VBN indictments NNS indict VB individuals NNS Individuals NNS indoctrinated VBN induced VBD induced VBN inducements NNS induces VBZ induce VB inducing VBG indulgences NNS indulges VBZ indulge VB indulging VBG industrialists NNS industrialized VBN industrialize VB industrials NNS industrials VBZ industries NNS Industries NNS inefficiencies NNS inequalities NNS inequities NNS infants NNS Infants NNS infected VBD infected VBN infecting VBG infections NNS inferences NNS inferred VBN infiltrated VBN infiltrate VB infiltrating VBG inflame VB inflated VBD inflated VBN inflates VBZ inflate VB inflating VBG Inflation-adjusted VBN inflicted VBD inflicted VBN inflict VB inflows NNS influenced VBD influenced VBN influences NNS influences VBZ influence VB 
influence VBP influencing VBG information-services NNS information-systems NNS informed VBD informed VBN informing VBG informs VBZ inform VB infractions NNS infringed VBD infringed VBN infringes VBZ infringe VB infringing VBG infuriated VBD infuriate VB infused VBN infuse VB ingest VB ingots NNS ingrates NNS ingratiate VB ingredients NNS inhabited VBN inhabits VBZ inhabit VBP inherited VBD inherited VBN inherits VBZ inherit VBP inhibited VBD inhibit VB inhibit VBP initialed VBD initialing VBG initials NNS initiated VBD initiated VBN initiate VB initiate VBP initiating VBG initiatiors NNS initiatives NNS initiatives VBZ injected VBD injected VBN injecting VBG injections NNS injects VBZ inject VB Inject VB injunctions NNS injured VBD injured VBN injure VB injuries NNS injuring VBG injustices NNS inks NNS inmates NNS innings NNS innocents NNS innoculating VBG innovated VBD innovate VB innovations NNS innovators NNS i NNS inns NNS innuendoes NNS inputs NNS inquired VBD inquiries NNS inquiring VBG inroads NNS insects NNS inserted VBD inserted VBN inserting VBG inserts NNS insert VB insiders NNS Insiders NNS insights NNS insinuating VBG insisted VBD insisted VBN insisting VBG Insisting VBG insists VBZ insist VB insist VBP inspected VBD inspected VBN inspecting VBG inspections NNS inspectors NNS inspectors VBZ Inspects VBZ inspect VB inspect VBP inspirations NNS inspired VBD inspired VBN Inspired VBN inspire VB inspire VBP installations NNS installed VBD installed VBN installing VBG installments NNS install VB install VBP instances NNS instigated VBD instill VB instincts NNS instituted VBD instituted VBN institute VB instituting VBG institutions NNS Institutions NNS instructed VBD instructed VBN instructing VBG instructions NNS instructors NNS instructs VBZ instruct VB instrumentalists NNS instruments NNS Instruments NNS insulated VBN insulate VB insulate VBP insulating VBG insulins NNS insulting VBG insult VB insurance-claims NNS insured VBD insured VBN Insureres NNS insurers NNS Insurers NNS INSURERS NNS insures VBZ insure VB insure VBP insurgents NNS insuring VBG integrated-technologies NNS integrated VBN integrate VB integrating VBG intellectuals NNS intended VBD intended VBN intends VBZ intend VB intend VBP intensified VBD intensified VBN intensifying VBG intensify VB intentions NNS intents NNS interactions NNS interceded VBD intercepted VBN Intercepting VBG interconnected VBN interconnect VB interested VBN interests NNS interests VBZ interest VB interfered VBD interferes VBZ interfere VB interfere VBP interfering VBG interior-furnishings NNS interiors NNS interjects VBZ interloping VBG intermediaries NNS intermixed VBD internationalists NNS international-operations NNS interpretations NNS interpreted VBD interpreted VBN interpreting VBG interprets VBZ interpret VB interpret VBP interrogated VBN interrogators NNS interrupted VBN interrupting VBG interruptions NNS interrupt VB intersections NNS interspersed VBN intersperses VBZ interstates NNS intertitles NNS intertwined VBN intertwining VBG intervals NNS intervened VBD intervened VBN intervene VB intervening VBG interventionists NNS interventions NNS interviewed VBD interviewed VBN interviewing VBG interviews NNS Interviews NNS interview VB intimate VB intimidated VBN intimidate VB intimidating VBG intimidations NNS intones VBZ intrigued VBN intrigues NNS introduced VBD introduced VBN Introduced VBN introduces VBZ introduce VB introducing VBG Introducing VBG introductions NNS intrude VBP intrusions NNS inundated VBN invaded VBD invaders NNS 
invades VBZ invade VB invade VBP invading VBG invalidated VBD invented VBD invented VBN inventing VBG inventions NNS inventories NNS Inventories NNS inventors NNS invent VB invent VBP inverted VBN invested VBD invested VBN investigated VBD investigated VBN investigates VBZ investigate VB investigating VBG Investigating VBG investigations NNS investigators NNS Investigators NNS investing VBG Investing VBG investing VBG|NN investments NNS investor-relations NNS investors NNS Investors NNS invests VBZ invest VB invest VBP invitations NNS invited VBD invited VBN invites VBZ invite VB inviting VBG invoices NNS invoked VBD invoked VBN invokes VBZ invoke VB invoking VBG involved VB involved VBD involved VBN Involved VBN involves VBZ involve VB involve VBP involving VBG IOUs NNS IPOs NNS IRAs NNS Irises NNS irked VBD irked VBN irks VBZ irk VB ironies NNS irons NNS iron VB irradiated VBN irregularities NNS irritated VBN irritates VBZ islands NNS islands VBZ is NNS isolated VBD isolated VBN isolates VBZ isolate VB isolate VBP issued VBD issued VBN issuers NNS issues NNS Issues NNS ISSUES NNS issues VBZ issue VB issue VBP issuing VBG is VBZ Is VBZ IS VBZ itemize VB items NNS Items NNS jabs NNS Jackals NNS jacked VBD jacked VBN jackets NNS Jackets NNS jackhammers NNS jacking VBG jack VB jailed VBD jailed VBN JAILED VBN jails NNS jammed VBD jammed VBN jams NNS jam VB Jan. VB Japanese-Americans NNS Japanese NNS Japanese VBP jarring VBG jars NNS jaunts NNS JAUNTS NNS jeans NNS Jeeps NNS jelled VBD jeopardized VBN jeopardizes VBZ jeopardize VB jeopardizing VBG jerked VBN jetliners NNS jets NNS Jets NNS jettisoning VBG jet VBP jewelers NNS jewels NNS Jews NNS jiggling VBG jillions NNS jingling VBG jinks NNS jinxed VBN jitters NNS jobs NNS Jobs NNS jockeys NNS jocks NNS jogs VBZ joined VBD joined VBN joining VBG Joining VBG joins VBZ JOINS VBZ joint-implants NNS joints NNS join VB JOIN VB join VBP joked VBD jokes NNS jokes VBZ joke VB jolted VBD jolted VBN jolts NNS jolt VB Jolt VB jostle VBP journalists NNS Journalists NNS journals NNS jousting VBG joys NNS judged VBN judgeships NNS judges NNS Judges NNS judge VB Judge VB judge VBP judging VBG Judging VBG judgments NNS jugglers NNS juggle VB juggling VBG jugs NNS juices NNS jumbos NNS jumped VBD jumped VBN jumping VBG Jumping VBG jumps NNS jumps VBZ jump VB jump VBP junctures NNS juniors NNS junk-bond NNS junkets NNS junk-holders NNS junkholders NNS Junk-holders NNS junkies NNS junk VB juries NNS jurisdictions NNS jurists NNS jurors NNS jury-rigged VBD justices NNS justified VBN justifies VBZ justifying VBG justify VB jutting VBG Jutting VBG juxtapose VBP kayoed VBN KC-135s NNS keen VB Keepers NNS keeping VBG Keeping VBG keeps VBZ keep VB Keep VB keep VBP kept VBD kept VBN ketchup VB|IN keyboards NNS keyed VBN keys NNS key VB kickbacks NNS kicked VBD kicked VBN kickers NNS kicking VBG kicks NNS kicks VBZ kick VB kick VBP kiddies NNS kidding VBG kidnapped VBD kidnapped VBN kidnappers NNS kidnap VB kids NNS Kids NNS killed VBD killed VBN killers NNS killings NNS killing VBG kills VBZ kill VB Kill VB kill VBP kilobytes NNS kilograms NNS kilometers NNS kindled VBN kinds NNS kinfolk NNS kingpins NNS kings NNS Kissing VBG Kiss VB kits NNS kneaded VBN kneading VBG knees NNS knew VBD knights NNS knitted VBN knitting VBG knit VBN knocked VBD knocked VBN knocking VBG knocks VBZ knock VB knots NNS knowing VBG Knowing VBG knowns NNS known VBN Known VBN knows VBZ know VB know VBP Know VBP knuckles NNS kowtow VB kronor NNS kudos NNS labeled VBD labeled VBN labeling VBG 
Labeling VBG labels NNS labels VBZ label VB label VBP laboratories NNS laborers NNS laboring VBG Laboring VBG labors NNS labs NNS laced VBN lacked VBD lacked VBN lackeys NNS lacking VBG lacks VBZ lack VBP ladies NNS laggards NNS lagged VBD lagged VBN lagging VBG lagoons NNS lags NNS lags VBZ Lags VBZ lag VB lag VBP laid VBD laid VBN lakes NNS lambasted VBD lambastes VBZ lamented VBD laments VBZ laminated VBN lampposts NNS lamps NNS landed VBD landed VBN landfills NNS landholdings NNS landings NNS landing VBG landlords NNS landowners NNS Landowners NNS landscapers NNS landscapes NNS landslides NNS lands NNS land VB Land VBP lanes NNS languages NNS languished VBD languished VBN languishes VBZ languishing VBG languish VB lapsed VBN lapses NNS lapses VBZ laps NNS laptops NNS Laptops NNS lap VBP lasers NNS lashed VBD lashing VBG lash VB lash VBP lasted VBD lasted VBN lasting VBG lasts VBZ last VB last VBP latched VBN latches VBZ latching VBG latch VBP lathes NNS lauded VBD lauded VBN laughed VBD laughed VBN laughing VBG laughs NNS laughs VBZ laugh VB launched VBD launched VBN launches NNS launches VBZ launching VBG launch VB laundered VBD laundered VBN Laundered VBN launderers NNS laundering VBG launder VB laurels NNS lavished VBN lavishing VBG lawbreakers NNS lawmakers NNS Lawmakers NNS LAWMAKERS NNS law-making NNS lawns NNS laws NNS lawsuits NNS Lawsuits NNS lawyers NNS Lawyers NNS LAWYERS NNS laxatives NNS layers NNS laying VBG layoffs NNS LAYOFFS NNS lays VBZ lay VB lay VBD lay VBP LBOs NNS leaders NNS LEADERS NNS leading VBG Leading VBG leads NNS leads VBZ Leads VBZ lead VB lead VBN lead VBP leafing VBG leaflets NNS leaguers NNS leagues NNS leaked VBD leaked VBN leakers NNS leaking VBG leaks NNS leaned VBD leaned VBN leaning VBG leans VBZ lean VB Lean VB lean VBP leaped VBD leaped VBN leapfrog VB leaping VBG Leaping VBG leaps NNS leapt VBD leap VB leap VBP learned VBD learned VBN learning VBG Learning VBG learns VBZ learn VB learn VBP leased VBD leased VBN leases NNS leases VBZ lease VB lease VBP leasing VBG leasing VBG|NN leathers NNS leaves NNS leaves VBZ leave VB Leave VB leave VBP leaving VBG Leaving VBG lectured VBD lectures VBZ lecture VB lecture VBP ledgers NNS led VBD led VBN Led VBN leeches NNS leftists NNS leftovers NNS left VBD Left VBD left VBN Left VBN legalizing VBG legal-services NNS legions NNS legislate VB Legislating VBG legislators NNS Legislators NNS legislatures NNS legitimized VBN legitimize VB legs NNS lemmings NNS lemons NNS lenders NNS Lenders NNS lending VBG lends VBZ lend VB Lend VB lend VBP lengthened VBD lengthened VBN lengthens VBZ lengthen VB lengthen VBP lengths NNS lenses NNS LENSES NNS lent VBD lent VBN leotards NNS lesbians NNS lesions NNS lessening VBG lessen VB lessers NNS lessons NNS lets VBZ letters NNS Letters NNS letting VBG Letting VBG let VB Let VB let VBD Let VBD let VBN let VBP leveled VBD leveled VBN leveling VBG levels NNS level VB level VBP leveraged VBN Leveraged VBN LEVERAGED VBN leverage VB leveraging VBG levied VBD levy VB liabilities NNS liaisons NNS Liaisons NNS liars NNS libeled VBN liberalizations NNS liberalized VBD liberalized VBN liberalize VB liberalize VBP liberalizing VBG liberals NNS Liberals NNS liberated VBD libertarians NNS liberties NNS librarians NNS libraries NNS lice NNS licensed VBD licensed VBN licenses NNS licenses VBZ license VB license VBP licensing VBG licking VBG Lids NNS lied VBD lies NNS lies VBZ LIES VBZ lieutenants NNS lie VB lie VBP lifeguards NNS lifes NNS lifted VBD lifted VBN lifting VBG lifts NNS lifts 
VBZ lift VB Lift VB lift VBP lighted VBN lightened VBD lightening VBG lighten VB lighting VBG lights NNS Lights NNS light VB liked VBD liked VBN likened VBD likened VBN likening VBG likes NNS likes VBZ like VB like VBP limbs NNS limitations NNS limited VBD limited VBN limiting VBG Limiting VBG limits NNS limits VBZ limit VB limit VBP limousines NNS limping VBG linebackers NNS lined VBD lined VBN liners NNS lines NNS Lines NNS lineups NNS line VB line VBP lingering VBG lingers VBZ linger VB Linger VB lining VBG linkages NNS linked VBD linked VBN linking VBG Linking VBG links NNS links VBZ link VB link VBP Link VBP lions NNS lipoproteins NNS lips NNS lipsticks NNS liquefied VBN liquefies VBZ liquefy VB liquefy VBP liquidated VBD liquidated VBN liquidate VB liquidating VBG Liquidating VBG liquids NNS lire NNS listed VBD listed VBN listened VBD listened VBN listeners NNS Listeners NNS listening VBG listens VBZ listen VB Listen VB listen VBP listings NNS listing VBG lists NNS lists VBZ list VB list VBP lithographs NNS litigants NNS litigators NNS littered VBN litter VBP lit VBD lit VBN lived VBD lived VBN live-hauled VBD live-haulers NNS lives NNS Lives NNS lives VBZ Lives VBZ live VB Live VB live VBP Live VBP living VBG Living VBG loaded VBD loaded VBN loadings NNS loading VBG loads NNS load VB loafers NNS loaned VBD loaned VBN loans NNS Loans NNS loans VBZ loan VB loathed VBD loathed VBN loathes VBZ loaves NNS lobbied VBD lobbied VBN lobbies NNS lobbying VBG lobbyists NNS lobby VB locales NNS localities NNS localized VBN locals NNS located VBN Located VBN locate VB locate VBP locating VBG locations NNS locked VBD locked VBN locking VBG locks NNS locks VBZ lock VB lock VBP locutions NNS lodged VBD lodged VBN lodge VB lodgings NNS logged VBD logged VBN loggers NNS logging VBG logistics NNS logos NNS log-rolled VBD logs NNS logs VBZ log VB log VBP long-term NNS long VBP looked VBD looked VBN lookee-loos NNS looking VBG Looking VBG looks NNS looks VBZ look VB Look VB look VBP looming VBG looms NNS looms VBZ loom VB loom VBP LOOM VBZ loonies NNS loopholes NNS loops NNS loosened VBN loosening VBG loosen VB loose VB looting VBG loot VB lopped VBD lorded VBD lords NNS losers NNS loses NNS loses VBZ lose VB lose VBP losing VBG losses NNS Losses NNS LOSSES NNS lost VBD Lost VBD lost VBN lotions NNS lots NNS Lots NNS lotteries NNS loudspeakers NNS louis NNS lounges NNS lovebirds NNS loved VBD loved VBN lovers NNS loves VBZ Loves VBZ love VB love VBP lowered VBD lowered VBN lowering VBG lowers VBZ lower VB lower VBP low-lifes NNS lows NNS loyalties NNS lubricants NNS lucked VBD lugged VBD lugging VBG lugs NNS lulled VBN lumber VBP luminaries NNS lumped VBN lumping VBG lumps NNS lumps VBZ lunch VB lunged VBD lunging VBG lungs NNS lurched VBD lurching VBG lurch VBP lured VBD lured VBN lures NNS lures VBZ lure VB Lure VBP luring VBG lurking VBG luxuries NNS lying VBG lyrics NNS Lyrics NNS machetes NNS Machiguengas NNS machines NNS Machines NNS machinists NNS Machinists NNS Machinists NNS|NNPS made VBD made VBN Made VBN mafias NNS mafiosi NNS magazines NNS Magazines NNS maggots NNS magicians NNS magistrates NNS magnetized VBN magnets NNS magnified VBD magnified VBN magnify VB Magnolias NNS maharajahs NNS mailed VBD mailed VBN mailers NNS mailings NNS mailing VBG mailmen NNS mail-sorting VBG mail VB mail VBP mainframes NNS mains NNS maintained VBD maintained VBN maintaining VBG maintains VBZ maintain VB maintain VBP Maintain VBP majoring VBG majors NNS makers NNS Makers NNS makes NNS makes VBZ make VB Make VB 
MAKE VB make VBP Make VBP making VBG Making VBG MAKING VBG Makin VBG malefactors NNS males NNS malfunctions NNS maligned VBN malls NNS mammoths NNS manacles NNS managed VBD managed VBN Managed VBN managements NNS managers NNS Managers NNS manages VBZ manage VB manage VBP managing VBG Managing VBG mandated VBD mandated VBN mandates NNS mandates VBZ mandate VB mandating VBG maneuvered VBD maneuvered VBN maneuverings NNS maneuvering VBG maneuvers NNS MANEUVERS NNS maneuvers VBZ maneuver VB manhandled VBN manifestations NNS manifestos NNS manifest VBP maninstays NNS manipulated VBN manipulates VBZ manipulate VB manipulate VBP manipulating VBG manipulations NNS manipulators NNS manned VBD mannerisms NNS manners NNS manning VBG mansions NNS manuals NNS MANUALS NNS manuevering VBG manufactured VBD manufactured VBN manufacturers NNS Manufacturers NNS manufactures VBZ manufacture VB manufacture VBP manufacturing VBG man VB many NNS many VB mapped VBN mapping VBG maps NNS map VB map VBP marathons NNS marbles NNS marched VBD marched VBN marchers NNS marches NNS marching VBG march VB march VBP Margeotes NNS marginalia NNS marginalizing VBG margin-calls NNS margined VBN margining VBG margins NNS Margins NNS markdowns NNS marked VBD marked VBN marketed VBD marketed VBN marketeers NNS marketers NNS Marketers NNS marketing-communications NNS marketing VBG market-makers NNS marketplaces NNS markets NNS Markets NNS markets VBZ market VB market VBP marking VBG markka NNS marks NNS Marks NNS marks VBZ mark VB mark VBP marquees NNS marred VBN marriages NNS married VBD married VBN marrying VBG marry VB marshes NNS marveled VBD marvels NNS marvel VB masked VBD masked VBN masks NNS Masks VBZ masons NNS masquerading VBG massacres NNS massages NNS massage VB massaging VBG massed VBD masses NNS masseurs NNS masseuses NNS mass-media NNS mass-producing VBG mastered VBN masterpieces NNS masters NNS master VB matched VBD matched VBN matches NNS matches VBZ matching VBG match VB match VBP mated VBN materialized VBD materialized VBN materializes VBZ materialize VB materialize VBP materials NNS Materials NNS mates NNS mathematics NNS mating VBG mattered VBN matters NNS Matters NNS|VBZ matters VBZ Matters VBZ matter VB matter VBP matured VBN matures VBZ mature VB mature VBP maturing VBG maturities NNS Maturities NNS maul VB mavens NNS maximize VB maximizing VBG maxims NNS mayors NNS mazes NNS McDonald VB meadows NNS meals NNS meandered VBD meanders VBZ meanings NNS meaning VBG means NNS Means NNS means VBZ Means VBZ meant VBD meant VBN mean VB Mean VB mean VBP measured VBD measured VBN Measured VBN measurements NNS measures NNS Measures NNS measures VBZ measure VB measuring VBG Meats NNS MEATS NNS mechanics NNS mechanisms NNS medallions NNS meddle VB meddling VBG media NNS mediate VB mediators NNS medical-products NNS medicines NNS meetings NNS Meetings NNS meeting VBG Meeting VBG meets NNS meets VBZ meet VB Meet VB meet VBP megabytes NNS mega-crashes NNS Mega-hits NNS mega-issues NNS mega-mergers NNS mega-problems NNS mega-projects NNS megaquestions NNS mega-resorts NNS megawatts NNS melding VBG melds VBZ meld VB mellowed VBN melodies NNS melting VBG melts VBZ melt VB memberships NNS members NNS Members NNS mementos NNS memoirs NNS memorabilia NNS memoranda NNS memorandums NNS memorialized VBN memories NNS memorize VBP memos NNS MEMOS NNS mend VB men NNS Men NNS mentioned VBD mentioned VBN mentioning VBG mentions VBZ mention VB mention VBP mentors NNS menus NNS Mercantilists NNS Mercedes-Benzes NNS Mercedes NNS 
merchandised VBN merchandisers NNS merchandising VBG merchants NNS Merchants NNS merged VBD merged VBN mergers NNS merge VB merge VBP merging VBG meringues NNS merits NNS merit VB merit VBP mesh VB messages NNS messengers NNS messing VBG Messrs. NNS mess VB metabolized VBN metals NNS Metals NNS METALS NNS metal-workers NNS metalworkers NNS metaphors NNS meted VBN meters NNS methodologies NNS methods NNS meting VBG metrics NNS met VBD met VBN mice NNS Mice NNS micoprocessors NNS microbes NNS microchips NNS microcomputers NNS microeconomics NNS microelectronics NNS microphones NNS microprocessors NNS microwaves NNS mid-1940s NNS mid-1960s NNS mid-1970s NNS mid-1980s NNS mid-1990s NNS middlemen NNS midsized VBN miffed VBD miffed VBN MiG-29s NNS mighta MD|VB migrate VB migrations NNS miles NNS milestones NNS military-electronics NNS militate VB militias NNS milked VBN milks NNS milk VB milling VBG millionaires NNS million-plus NNS millions NNS Millions NNS mills NNS mimics NNS mimics VBZ mimic VB mimic VBP mince VB minded VBD minds NNS mind VB Mind VB minefields NNS minerals NNS miners NNS mines NNS mine VBP mingle VBP miniaturized VBN minicars NNS minicomputers NNS minimills NNS minimized VBN minimize VB minimizing VBG minimums NNS mining VBG miniseries NNS ministers NNS ministries NNS minisupercomputers NNS minivans NNS Minneapolis NNS minorities NNS minors NNS minted VBN minting VBG mints NNS minuses NNS Minuses NNS minutes NNS minutiae NNS MIPs NNS MIPS NNS mired VBN mirrored VBD mirrors VBZ mirror VB mirror VBP misadventures NNS miscalculated VBD miscalculated VBN miscarriages NNS misclassified VBN miscreants NNS misdeeds NNS misdemeanors NNS misfortunes NNS misguided VBN mishandled VBD mishandling VBG misinterpreted VBN misinterpret VB misjudged VBD misjudgments NNS mislaid VBN misleading VBG misled VBD misled VBN mismeasurements NNS misperceptions NNS misplaced VBN misquoting VBG misrepresentations NNS misrepresented VBD misrepresenting VBG misrepresents VBZ misrepresent VB misrouted VBN missed VBD missed VBN misses VBZ missiles NNS missing VBG missionaries NNS missions NNS misspent VBN misstated VBD misstated VBN misstatements NNS misstates VBZ miss VB miss VBP mistaken VBN mistakes NNS mistake VB mistreat VB mistresses NNS mistrials NNS mists NNS misunderstandings NNS Misunderstanding VBG misunderstood VBN misused VBD mites NNS mitigate VB mitigating VBG Mitsubishi NNS Mitsui NNS mixed VBD mixed VBN Mixed VBN mixers NNS mixes VBZ mixing VBG mixtures NNS mix VB moaning VBG moans VBZ moan VB mobilized VBD mobilized VBN mobilize VB mobilizing VBG mocked VBN mocking VBG modeled VBD modeled VBN modeling VBG models NNS model VB modems NNS moderated VBN moderates NNS moderate VB moderate VBP moderating VBG modernized VBD modernized VBN modernize VB modernizing VBG modes NNS modifications NNS Modifications NNS modified VBN modifies VBZ modify VB modulate VBP moisturizers NNS molded VBN molds NNS molecules NNS mollified VBN mollify VB moments NNS Mondays NNS monetarists NNS moneymakers NNS monitored VBD MONITORED VBD monitored VBN monitoring VBG monitors NNS monitors VBZ monitor VB monitor VBP monkeys NNS monoliths NNS monologues NNS monopolies NNS monopolized VBD monopolized VBN monopolize VB monopolizing VBG months NNS Months NNS Moonies NNS moonlighting VBG moons NNS mopping VBG mop VB morals NNS mores NNS mornings NNS morsels NNS mortgaged VBN mortgages NNS mortgage VB Moslems NNS motels NNS mothers NNS Mothers NNS motifs NNS motions NNS motions VBZ motivated VBN motivate VB motivate VBP 
motivating VBG motives NNS motorcycles NNS motorists NNS motorized VBN motors NNS mounds NNS mountains NNS mounted VBD mounted VBN mounting VBG mounts VBZ mount VB mount VBP mourning VBG Mourning VBG mousetraps NNS mouthed VBD mouths NNS moved VBD MOVED VBD moved VBN movements NNS moves NNS Moves NNS moves VBZ MOVES VBZ move VB Move VB move VBP Move VBP movies NNS moving VBG Moving VBG mow VB mucked VBN muddied VBN muddled VBN muffled VBN muffs NNS mulling VBG mulls VBZ mull VB multimedia NNS multinationals NNS multipled VBD multiples NNS multiplied VBN multiplying VBG multiply VB multiply VBP mumbled VBN mummies NNS Munching VBG municipalities NNS municipals NNS Municipals NNS MUNICIPALS NNS muni NNS munis NNS murals NNS murdered VBN murderers NNS murdering VBG murders NNS murmuring VBG muscled VBD muscles NNS muscling VBG Muscovites NNS muses NNS muses VBZ museums NNS Museums NNS muse VB mushroomed VBD mushroomed VBN mushrooms NNS musicians NNS muster VB mutated VBN mutate VB mutations NNS muted VBN mute VB mutilated VBN Mutinies NNS mutters NNS mutts NNS muzzles VBZ 'm VBP mysteries NNS myths NNS nabbing VBG naggings NNS nagging VBG nags NNS nailed VBN nails NNS nail VB name-droppers NNS name-drops VBZ named VBD named VBN Named VBN nameplates NNS names NNS Names NNS names VBZ name VB name VBP naming VBG narcotics NNS narratives NNS narrowed VBD narrowed VBN narrowing VBG Narrowing VBG narrows VBZ narrow VB nationalists NNS nationalized VBD nationalized VBN nationals NNS nations NNS natives NNS natural-foods NNS natural-resources NNS navies NNS navigate VB naysayers NNS naysay VB Nazis NNS Neanderthals NNS neared VBD nearing VBG near-monopolies NNS nears VBZ necessitated VBD necessitated VBN necessities NNS necks NNS neckties NNS needed VBD needed VBN needed VBN|JJ needing VBG needs NNS Needs NNS needs VBZ need VB need VBP negated VBN negatives NNS neglected VBD neglected VBN neglecting VBG negotiated VBD negotiated VBN negotiates VBZ negotiate VB negotiate VBP negotiating VBG negotiations NNS Negotiations NNS negotiators NNS Negotiators NNS neighbhorhoods NNS neighborhoods NNS neighboring VBG neighbors NNS neighbours NNS neophytes NNS nerds NNS Nerds NNS nerves NNS Nestled VBN nests NNS nets NNS nets VBZ netted VBD netted VBN netting VBG net VB networking VBG networks NNS Networks NNS network VB neurologists NNS neutralized VBN neutralizes VBZ neutrons NNS newborns NNS newcasts NNS newcomers NNS newscasts NNS newsies NNS newsletters NNS News NNS newspapers NNS Newspapers NNS newsprints NNS newsstands NNS Newsstands NNS news-weeklies NNS nibbling VBG niches NNS Nicholas NNS nicked VBN nicknamed VBN nicknames NNS nightclubs NNS nightmares NNS nights NNS nine-months NNS nine-tenths NNS nixed VBD noblemen NNS nods VBZ no-loads NNS nominated VBD nominated VBN nominate VB nominations NNS nominees NNS non-clients NNS non-communists NNS nonconformists NNS non-economists NNS non-lawyers NNS Non-lawyers NNS nonoperating VBG Nonperformers NNS nonperforming VBG Nonperforming VBG nonrecurring VBG non-seamen NNS nonstops NNS noodles NNS normalize VB norms NNS Norms NNS Northrop VB nose-dived VBD nosedived VBD nose-dived VBN nosediving VBG noses NNS Nos. NNS notched VBD notch VB notebooks NNS noted VBD noted VBN noteholders NNS notes NNS Notes NNS NOTES NNS notes VBZ note VB Note VB NOTE VB note VBP noticed VBD noticed VBN notices NNS notice VB notice VBP noticing VBG notifications NNS notified VBD notified VBN notifies VBZ notifying VBG notify VB notify VBP noting VBG Noting VBG notions NNS No. 
VB novels NNS novelties NNS novitiates NNS Nov. VB nozzles NNS nuances NNS nuclear-arms NNS nudge VB nullified VBN nullify VB nullify VBP number-crunchers NNS numbered VBD numbered VBN numbering VBG numbers NNS nursed VBD nurseries NNS nurses NNS nursing VBG nurtured VBD nurtured VBN nurture VB nurturing VBG nuts NNS oaks NNS Oases NNS oats NNS obey VBP obfuscate VB objected VBD objected VBN objecting VBG objections NNS Objections NNS objectives NNS objects NNS object VB object VBP obligated VBD obligated VBN obligations NNS Obligations NNS obliged VBN obliged VBN|JJ obliges VBZ obliterated VBN obscured VBD obscures VBZ obscure VB observations NNS observed VBD observed VBN observers NNS Observers NNS observes VBZ observe VB observe VBP observing VBG Observing VBG obsessed VBN obsoleted VBN obsoleting VBG obstacles NNS obstructed VBN obstructing VBG obstruct VBP obtained VBD obtained VBN obtaining VBG obtain VB obtain VBP obviate VB occasions NNS occasion VB occupations NNS occupied VBD occupied VBN occupies VBZ occupying VBG occupy VB occurred VBD occurred VBN occurrences NNS occurring VBG occurs VBZ occur VB occur VBP oceans NNS octaves NNS octogenarians NNS oddballs NNS oddities NNS ODDITIES NNS odds NNS Odds NNS offenders NNS offending VBG offends VBZ offend VB offensives NNS offered VBD offered VBN Offered VBN OFFERED VBN offerings NNS offering VBG Offering VBG offers NNS offers VBZ offer VB Offer VB offer VBP off-hours NNS officals NNS officers NNS Officers NNS offices NNS Offices NNS office-supplies NNS officials NNS Officials NNS OFFICIALS NNS offi NNS offsets NNS offsetting VBG Offsetting VBG offset VB offset VBD offset VBN offset VBP offshoots NNS offspring NNS ogles VBZ ogling VBG oils NNS Oils NNS olds NNS old-timers NNS olefins NNS Olympics NNS omens NNS omissions NNS omits VBZ omitted VBD omitted VBN omit VB omit VBP oncogenes NNS Oncogenes NNS ones NNS onlookers NNS Onlookers NNS on-ramps NNS ooze VB oozing VBG opened VBD opened VBN openended VBN openers NNS openings NNS opening VBG opens VBZ open VB Open VB open VBP operas NNS operated VBD operated VBD|VBN operated VBN operates VBZ operate VB operate VBP operating VBG Operating VBG operations NNS operatives NNS operators NNS opining VBG opinion-makers NNS opinions NNS Opinions NNS opponents NNS Opponents NNS opportunists NNS opportunities NNS opposed VBD opposed VBN Opposed VBN opposes VBZ oppose VB oppose VBP opposing VBG opted VBD opted VBN optical-products NNS optimists NNS opting VBG options NNS Options NNS OPTIONS NNS option VBP opt VB opt VBP oranges NNS orchardists NNS orchards NNS orchestras NNS orchestrated VBD orchestrated VBN orchestrating VBG orchids NNS ordained VBN ordered VBD ordered VBN ORDERED VBN ordering VBG orders NNS Orders NNS orders VBZ order VB ordinances NNS organisms NNS organizations NNS Organizations NNS organized VBD organized VBN ORGANIZED VBN organizers NNS organizes VBZ organize VB organizing VBG organs NNS oriented VBN originated VBN originated VBP originates VBZ originate VB originating VBG originations NNS originators NNS origins NNS Orkem VB ornaments NNS orphaned VBN orphans NNS others NNS Others NNS ounces NNS ousted VBD ousted VBN OUSTED VBN ousting VBG oust VB outages NNS outbidding VBG outbid VB outbid VBP outbreaks NNS outcomes NNS outdated VBN outdid VBD outdistanced VBN outdone VBN outfielders NNS outfits NNS outfit VB outflank VB outflows NNS Outflows NNS outfly VB outgained VBD outgrew VBD outgrown VBN outings NNS outlanders NNS outlasted VBD outlast VB outlawed VBD outlawed VBN 
outlawing VBG outlays NNS Outlays NNS outleaped VBD outlets NNS outlined VBD outlined VBN outlines VBZ outline VB outlining VBG outlooks NNS outmoded VBN outnumbered VBD out-of-staters NNS outpaced VBD outpaced VBN outpaced VBP outpace VB outpace VBP outpacing VBG outperformed VBD outperformed VBN outperforming VBG outperforms VBZ outperform VB outperform VBP outposts NNS outraged VBN outranks VBZ outselling VBG outsells VBZ outsell VB outshines VBZ outshine VB outsiders NNS outskirts NNS out-smart VB outsold VBD outstripped VBD outstripped VBN outstripping VBG outstrips VBZ outstrip VB out-trade VB outweighed VBD outweighed VBN outweigh VB outweigh VBP ovens NNS over-allotments NNS overalls NNS overarching VBG overbid VB overbid VBD overbought VBN overburden VB overcame VBD overcharges NNS overcollateralized VBN overcomes VBZ overcome VB overcome VBN overcome VBP overcommitted VBN overdoing VBG overdone VBN overdosed VBN overdosing VBG overemphasize VB overflowing VBG overhanging VBG overhauled VBN overhauling VBG overhaul VB overheated VBN overheating VBG overlaid VBN overlapping VBG overlap VB overlap VBP overlays VBZ overlooked VBD overlooked VBN overlooking VBG overlooks VBZ overlook VB overlook VBP over-magazined VBN overpaid VBD overpaid VBN overpaying VBG overpay VB overplanted VBN overpower VB overpriced VBN overpurchase VB overreacted VBN overreacting VBG Overreacting VBG overreact VB overreact VBP override VB overriding VBG overrode VBD overruled VBD overruled VBN overrule VB overruling VBG overruns NNS oversaw VB oversaw VBD overseeing VBG overseen VBN overseers NNS oversees VBZ oversee VB overshadowed VBD overshadowed VBN overshadowing VBG oversimplified VBN oversold VB oversold VBN overstated VBD overstated VBN overstate VB overstating VBG overstrained VBN oversubscribed VBN overtaken VBN overtaxed VBN overthrowing VBG overthrown VBN overthrow VB overtures NNS overturned VBD overturned VBN overturning VBG overturn VB overused VBN overvalued VBD overvalued VBN overweighted VBN overwhelmed VBD overwhelmed VBN overwhelming VBG overwhelm VB overwhelm VBP overworking VBG owed VBD owed VBN owes VBZ owe VB owe VBP owing VBG owned VBD owned VBN owners NNS Owners NNS owning VBG Owning VBG owns VBZ own VB own VBN own VBP paced VBN pacemakers NNS pace VB pacified VBD packaged-goods NNS Packaged-goods NNS packaged VBN packages NNS Packages NNS packages VBZ package VB packaging VBG packed VBD packed VBN packets NNS packing VBG packs NNS packs VBZ pack VB pack VBP PACs NNS PACS NNS pacts NNS paddles NNS paeans NNS pages NNS paid VBD paid VBN Paid VBN paid VBN|JJ PaineWebber VB pains NNS painted VBD painted VBN painters NNS paintings NNS Paintings NNS painting VBG paints NNS paint VB paint VBP paired VBN pairs NNS pair VB palazzi NNS paled VB paled VBD pales VBZ pale VBP palms NNS palmtops NNS Palmtops NNS palm VB pals NNS pampers VBZ pamphlets NNS pancakes NNS pandering VBG panelists NNS panels NNS pangs NNS panicked VBD panicking VBG panics NNS panic VB panjandrums NNS panned VBD panned VBN panning VBG Pantages NNS panties NNS pants NNS pan VB paper-goods NNS PAPER NNS paper-products NNS papers NNS PAPERS NNS parachute VB parachuting VBG parades NNS parakeets NNS parallels NNS parallels VBZ parallel VB paralyzed VBN paralyzing VBG Paramedics NNS parameters NNS paraphernalia NNS paraphrase VBP parasites NNS parastatals NNS parcels NNS parcel VB parcel VBP parched VBN pardoned VBD pared VBD pared VBN parents NNS Parents NNS pare VB Paribas NNS parimutuels NNS paring VBG parishes NNS 
parishioners NNS parities NNS parked VBD parked VBN parking VBG parks NNS park VB Park VB parlors NNS parried VBD parry VB partake VB parted VBD participants NNS Participants NNS participated VBD participated VBN participates VBZ participate VB participate VBP participating VBG participations NNS particulars NNS parties NNS Parties NNS parties VBZ parting VBG partisans NNS Partisans NNS partnerships NNS Partnerships NNS partners NNS Partners NNS PARTNERS NNS parts NNS Parts NNS part VB pashas NNS passages NNS passed VBD passed VBN Passed VBN passenger-kilometers NNS passengers NNS passers-by NNS passes NNS passes VBZ passing VBG passions NNS passports NNS pass VB pass VBP passwords NNS pasted VBN pastels NNS pasteurized VBN pastimes NNS pastors NNS patched VBN patch VB patented VBD patented VBN patents NNS paths NNS patients NNS Patients NNS patrolled VBN patrols NNS patronized VBN patronize VB patronizing VBG patrons NNS patterned VBN patterns NNS Patterns NNS paused VBD pauses NNS pauses VBZ pause VB pause VBP pausing VBG paved VBD paved VBN paves VBZ pave VB pawing VBG pawning VBG pawns NNS payables NNS paychecks NNS payers NNS Payers NNS paying VBG Paying VBG payments NNS Payments NNS PAYMENTS NNS payoffs NNS payouts NNS Payouts NNS payrolls NNS pays VBZ PAYS VBZ pay VB Pay VB PAY VB pay VBP PCBs NNS PCs NNS peacemakers NNS peaches NNS peaked VBD peaked VBN peaking VBG peaks NNS peak VB pealing VBG peals NNS peanuts NNS pearls NNS pears NNS peasants NNS Peasants NNS peas NNS peccadilloes NNS pecks NNS peck VBP peculiarities NNS pedaled VBN pedaling VBG pedal VB peddled VBN peddles VBZ peddle VB peddle VBP peddling VBG pedestrians NNS Pedigrees NNS Peeking VBG peeled VBN peering VBG peers NNS peers VBZ peer VB peer VBP pegged VBD pegged VBN pegging VBG pegs VBZ peg VB peg VBP pellets NNS penalized VBN penalizes VBZ penalize VB penalties NNS pence NNS pencils NNS Pencils NNS PENCILS NNS Pencil VB pending VBG Pending VBG pending VBG|JJ penetrated VBN penetrate VB penetrating VBG penises NNS penned VBN pennies NNS pensions NNS pens NNS peopled VBN people NNS People NNS peoples NNS peppered VBD peppering VBG peppers NNS Pepsi NNS perceived VBD perceived VBN perceives VBZ perceive VBP percentages NNS perceptions NNS perched VBN perfected VBN performances NNS performed VBD performed VBN performers NNS performing-arts NNS performing VBG Performing VBG performs VBZ perform VB perform VBP perils NNS periodicals NNS periods NNS Periods NNS peripherals NNS perishables NNS perished VBN perked VBD perked VBN perks NNS permeated VBD permeating VBG permits NNS permits VBZ permitted VBD permitted VBN permitting VBG permit VB permit VBP perpetrated VBN perpetuates VBZ perpetuate VB perpetuate VBP perpetuating VBG persecuted VBN persecuting VBG persisted VBD persisting VBG persists VBZ persist VB persist VBP personalities NNS personalized VBN personalize VB personnel NNS Personnel NNS persons NNS persuaded VBD persuaded VBN persuades VBZ persuade VB persuading VBG Persuading VBG pertains VBZ perturbed VBD peruse VB peruse VBP pervaded VBD pervade VBP perversities NNS pesatas NNS pesetas NNS pesos NNS pessimists NNS Pestered VBN pesticides NNS petitioned VBD petitions NNS petition VB petrochemicals NNS pets NNS PETS NNS pharaohs NNS pharmaceuticals NNS Pharmaceuticals NNS pharmacies NNS pharmacists NNS phased VBD phased VBN phases NNS phase VB phasing VBG phenomena NNS Phillips NNS philosophers NNS philosophies NNS phobias NNS phoned VBD phoned VBN phones NNS phones VBZ phone VBP phoning VBG photocopiers 
NNS photocopying VBG photocopy VB photofinishers NNS photographed VBN photographers NNS photographing VBG photographs NNS photographs VBZ photos NNS phrases NNS physicians NNS physics NNS pianos NNS piasters NNS picked VBD picked VBN pickers NNS picking VBG Pickin VBG pickles NNS picks NNS picks VBZ pickups NNS pick VB Pick VB pick VBP pictured VBN pictures NNS Pictures NNS pictures VBZ picture VBP picturing VBG pieced VBN pieces NNS Pieces NNS piece VB Pierce VB piers NNS pies NNS piggybacking VBG Piggybacking VBG piglets NNS pigments NNS pigs NNS piled VBD piled VBN piles NNS pile VB pile VBP pilings NNS piling VBG PILING VBG pillars NNS pilloried VBN pillorying VBG pillowcases NNS pillows NNS pills NNS pilots NNS Pilots NNS pimps NNS pinched VBD pinched VBN pinching VBG pinch VB pine VBP pinging VBG ping VB pinned VBN pinning VBG pin-pointed VBN pinpointed VBN pinpoint VB pins NNS pins VBZ pints NNS pin VB pioneered VBD pioneers NNS pioneer VB piped VBD piped VBN pipelines NNS pipes NNS pirated VBN pirates NNS piroghi NNS pistils NNS pistols NNS pistons NNS pitched VBD pitched VBN pitchers NNS pitches NNS pitches VBZ pitching VBG pitchmen NNS pitch VB pitch VBP pitfalls NNS Pitfalls NNS pits NNS pits VBZ pitted VBD pitted VBN pitting VBG pit VB pivot VB pizzas-with-everything NNS pizzerias NNS placated VBN placate VB placed VBD placed VBN placements NNS places NNS places VBZ place VB Place VB place VBP placing VBG plagued VBD plagued VBN plague VB plaguing VBG plainclothes NNS plains NNS Plains NNS plaintiffs NNS Plaintiffs NNS planes NNS planets NNS planks NNS planned VBD planned VBN planners NNS Planners NNS planning VBG plans NNS Plans NNS plans VBP plans VBZ Plans VBZ PLANS VBZ plantations NNS planted VBD planted VBN planting VBG plants NNS PLANTS NNS plant VB plan VB plan VBP plastics NNS Plastics NNS plates NNS platforms NNS platitudes NNS plaudits NNS played VBD played VBN players NNS Players NNS playgrounds NNS playing VBG Playing VBG playoffs NNS plays NNS plays VBZ Plays VBZ play VB play VBP pleaded VBD pleaded VBN pleadings NNS pleading VBG plead VB pleasantries NNS pleased VBD pleased VBN pleases VBZ please VB Please VB please VBP pleasing VBG pleas NNS pleasures NNS plea VB pledged VBD pledged VBN pledges NNS pledges VBZ pledging VBG pliers NNS plies VBZ plights NNS plods VBZ plots NNS plotted VBD plotters NNS plotting VBG plot VB plowed VBD plowed VBN plows VBZ plow VB ploys NNS Ploys NNS plucked VBN pluck VB plugged VBD plugging VBG Plugging VBG plug VB plug VBP plummeted VBD plummeted VBN plummeting VBG plummet VB plummet VBP plunged VBD plunged VBN plunges NNS plunges VBZ plunge VB plunge VBP plunging VBG plunking VBG pluses NNS Pluses NNS plying VBG Poachers NNS poaching VBG pocketing VBG pockets NNS Pockets NNS pockets VBZ pocket VB pockmarked VBN pointed VBD pointed VBN pointers NNS pointing VBG points NNS points VBZ point VB point VBP poised VBN poisoned VBN poisons NNS poked VBD pokes VBZ poking VBG polarized VBN poles NNS Poles NNS police NNS Police NNS polices NNS police VB policies NNS Policies NNS policing VBG policyholders NNS policy-makers NNS policy-making VBG polished VBD polished VBN polishing VBG|NN polish VB politicians NNS Politicians NNS politicized VBN politico-plaintiffs NNS politics NNS Politics NNS POLITICS NNS polled VBD polled VBN pollen-producing VBG pollinated VBN pollinate VB pollinate VBP pollinating VBG polls NNS Polls NNS pollsters NNS polls VBZ pollutants NNS polluters NNS pollute VB polluting VBG poll VB pols NNS poltergeists NNS polymers 
NNS polyols NNS polyps NNS polyrhythms NNS pondering VBG ponder VB ponder VBP ponds NNS ponied VBD ponies NNS pontificate VBP ponying VBG pooled VBN pooling VBG pools NNS pool VBP popping VBG pops VBZ popularized VBD popularized VBN popularize VB populated VBN populate VB populating VBG populations NNS pop VB pop VBP porcelains NNS porches NNS pored VBD pored VBN pores VBZ pork-barrelers NNS portables NNS portends VBZ portend VB portfolios NNS Portfolios NNS PORTING VBG portions NNS portraits NNS portrayals NNS portrayed VBD portrayed VBN portraying VBG portrays VBZ portray VB portray VBP ports NNS Ports NNS posed VBD posed VBN poses VBZ pose VB pose VBP posing VBG positioned VBD positioned VBN positions NNS positions VBZ position VB possessed VBD possessed VBN possesses VBZ possessing VBG possessions NNS possess VB possess VBP possibilities NNS postcards NNS posted VBD Posted VBD posted VBN Posted VBN posters NNS postings NNS posting VBG postmarked VBN postmarks NNS postponed VBD postponed VBN postpone VB postpone VBP postponing VBG posts NNS posts VBZ Posts VBZ posturing VBG post VB POTABLES NNS potatoes NNS potentates NNS potentialities NNS potholes NNS pots NNS pot VB pouches NNS pounce VB pounded VBN pounding VBG pounds NNS pound VB poured VBD poured VBN pouring VBG pours VBZ pour VB pour VBP powders NNS powered VBN powerhouses NNS powers NNS power VB practiced VBD practiced VBN practices NNS practice VB practicing VBG practitioners NNS pragmatists NNS prairies NNS praised VBD praised VBN praises NNS praises VBZ praise VB praise VBP praising VBG prancing VBG prayers NNS praying VBG preaching VBG preach VB preach VBP pre-approved VBN preapproved VBN prearranged VBN precautions NNS preceded VBN precedents NNS precedes VBZ precede VB preceding VBG precincts NNS precious-metals NNS Precious-metals NNS precipices NNS precipitated VBD precipitating VBG precluded VBN precludes VBZ preclude VB predates VBZ predators NNS predecessors NNS predetermined VBN predicated VBN predict\/advocate VBP predicted VBD predicted VBN predicting VBG Predicting VBG predictions NNS Predictions NNS predicts VBZ predict VB predict VBP predispose VB pre-empted VBD pre-empt VB preferences NNS preferred VBD preferred VBG preferred VBN preferring VBG prefers VBZ prefer VB prefer VBP prejudiced VBN prejudices NNS premiered VBD premieres NNS premiere VB premiering VBG premises NNS premiums NNS preoccupied VBN prepaid VB prepaid VBN preparations NNS preparatives NNS prepared VBD prepared VBN preparers NNS prepares VBZ prepare VB prepare VBP preparing VBG prepaying VBG prepayments NNS Prepayments NNS prepay VB prepping VBG pre-registered VBN pre-register VB prerogatives NNS presages VBZ presage VB preschoolers NNS prescribed VBN prescribes VBZ prescribe VB prescribe VBP prescriptions NNS presentations NNS presented VBD presented VBN presenters NNS presenting VBG presents NNS presents VBZ present VB Present VB present VBP preserved VBD preserved VBN preserves VBZ preserve VB preserving VBG presided VBD presided VBN presidents NNS Presidents NNS presides VBZ presiding VBG pre-signed VBN pressed VBD pressed VBN Pressed VBN presses NNS pressing VBG pressured VBD pressured VBN pressures NNS Pressures NNS pressure VB pressure VBP pressuring VBG press VB Press VB press VBP presumed VBN presumes VBZ presuming VBG pretending VBG pretend VB Pretend VB pretensions NNS pre-tested VBN pre-try VB prevailed VBD prevailed VBN prevailing VBG prevails VBZ prevail VB prevail VBP prevented VBD prevented VBN Prevented VBN preventing VBG 
prevents VBZ prevent VB Prevent VB prevent VBP previewing VBG previews NNS prey VBP priced VBD priced VBN price-earnings NNS price\/earnings NNS prices NNS Prices NNS PRICES NNS prices VBZ price VB price VBP pricings NNS pricing VBG pricked VBN priests NNS primed VBN primitives NNS princes NNS principals NNS principles NNS printed VBD printed VBN printers NNS printing VBG printing VBG|NN printouts NNS prints NNS prints VBZ print VB print VBP priorities NNS prisoners NNS prisons NNS privatized VBN privatize VB privatizing VBG privileges NNS prized VBN prizes NNS probabilities NNS probes NNS probe VB probe VBP probing VBG Probing VBG problematics NNS problems NNS procedures NNS proceeded VBD proceeded VBN proceedings NNS PROCEEDINGS NNS proceeding VBG proceeds NNS Proceeds NNS proceeds VBZ proceed VB proceed VBP processed VBD processed VBN processes NNS processes VBZ processing VBG Processing VBG processors NNS process VB process VBP proclaimed VBD proclaiming VBG proclaims VBZ proclaim VB proclaim VBP proclamations NNS procure VB prodded VBN prodding VBG prods VBZ produced VBD produced VBN producers NNS Producers NNS produces VBZ produce VB Produce VB produce VBP producing VBG productions NNS products NNS PRODUCTS NNS prod VB professed VBD professed VBN professes VBZ professionals NNS Professionals NNS professions NNS professors NNS profess VBP proffered VBD proffered VBN profferred VBN profiled VBN profiles NNS profile VB profited VBD profited VBN profiteering VBG profiteers NNS profiting VBG profit-sharing NNS profits NNS Profits NNS PROFITS NNS profits VBZ profit-taking NNS profitting VBG profit VB profit VBP progenitors NNS prognosticators NNS programmed VBN programmers NNS programming VBG programs NNS Programs NNS program VB program VBP progressed VBD progressed VBN progresses VBZ progressing VBG progressions NNS progressives NNS progress VB prohibited VBD prohibited VBN prohibiting VBG prohibitions NNS prohibits VBZ prohibit VB prohibit VBP projected VBD projected VBN Projected VBN projecting VBG Projecting VBG projections NNS projectors NNS projects NNS Projects NNS projects VBZ project VB project VBP proliferated VBN proliferate VBP proliferating VBG prolonged VBN prolong VB promised VBD promised VBN promises NNS promises VBZ Promises VBZ promise VB promise VBP promising VBG promoted VBD promoted VBN promoters NNS promotes VBZ promote VB promote VBP promoting VBG promotions NNS prompted VBD prompted VBN Prompted VBN prompting VBG prompts VBZ prompt VB promulgated VBD prongs NNS pronounced VBD pronounced VBN pronouncements NNS pronounces VBZ proof-of-purchases NNS proofreading VBG propagandists NNS propagandizes VBZ propagandize VB propelled VBD propelled VBN propelling VBG propel VB properties NNS proponents NNS Proponents NNS proportions NNS proposals NNS Proposals NNS PROPOSALS NNS proposed VBD proposed VBN proposes VBZ propose VB propose VBP proposing VBG propositions NNS propped VBD propped VBN propping VBG proprietorships NNS proprietors NNS propsed VBN props NNS prop VB proscribed VBN proscribes VBZ prosecuted VBD prosecuted VBN prosecute VB prosecuting VBG prosecutions NNS prosecutors NNS Prosecutors NNS PROSECUTORS NNS pros NNS Pros NNS prospects NNS Prospects NNS PROSPECTS NNS prospectuses NNS prospered VBN prosper VB prostitutes NNS protected VBD protected VBN protecting VBG protections NNS protectors NNS protects VBZ protect VB protect VBP proteges NNS proteins NNS proteins VBZ protested VBD protested VBN protesters NNS protesting VBG protestors NNS protests NNS protests 
VBZ protest VB protocols NNS prototypes NNS proved VBD proved VBN proven VBN Proverbs NNS proves VBZ Proves VBZ prove VB prove VBP provided VBD provided VBN Provided VBN providers NNS provides VBZ provide VB Provide VB provide VBP Provide VBP providing VBG provinces NNS proving VBG provisioning VBG provisions NNS provoked VBD provoked VBN provoke VB provoking VBG proxies NNS pruned VBN prune VB pseudo-lobbyists NNS psychics NNS psychologists NNS Psychologists NNS publications NNS publicized VBN publicize VB public-relations NNS public-works NNS Public-works NNS published VBD published VBN Published VBN publishers NNS Publishers NNS publishes VBZ publishing VBG publish VB pubs NNS puffers NNS pull-backs NNS pullbacks NNS pulled VBD pulled VBN pulling VBG pullouts NNS pulls NNS pulls VBZ pull VB Pull VB pull VBP pulverizing VBG pummeled VBD pummeled VBN pummel VB pumped VBD pumped VBN pumping VBG pumps NNS pump VB pump VBP punched VBD punched VBN punchers NNS punching VBG Punching VBG punch VB punch VBP pundits NNS punished VBN punishing VBG punish VB puns NNS punts NNS pupils NNS puppets NNS puppies NNS purchased VBD purchased VBN purchasers NNS purchases NNS purchases VBZ purchase VB purchase VBP purchasing VBG purchasing VBG|NN purged VBD purged VBN purges VBZ purge VB purging VBG purists NNS pur-poises NNS purports VBZ purport VBP purposes NNS purrs VBZ purse-snatchings NNS purses NNS pursued VBD pursued VBN pursuers NNS pursues VBZ pursue VB pursue VBP pursuing VBG pursuits NNS pushed VBD pushed VBN pushers NNS pushes VBZ pushing VBG Pushing VBG push VB push VBP Push VBP puts NNS puts VBZ Puts VBZ putting VBG Putting VBG put VB Put VB put VBD Put VBD put VBN Put VBN put VBP put VBP|VB puzzled VBD puzzled VBN puzzles NNS puzzle VB pyramiding VBG pyramids NNS quacks NNS quacks VBZ quadrupeds NNS quadrupled VBD quadrupled VBN quadruples VBZ quadrupling VBG quakes NNS qualifications NNS qualified VBD qualified VBN qualifies VBZ qualifying VBG qualify VB qualify VBP qualities NNS qualms NNS quantified VBN quantify VB quantities NNS quarreling VBG quarrel VB quarterbacks NNS quarters NNS quartets NNS quashed VBD quashed VBN quashing VBG queers NNS quell VB queried VBN queries NNS queries VBZ questioned VBD questioned VBN Questioned VBN questioning VBG questions NNS Questions NNS questions VBZ question VB question VBP queues NNS queuing VBG quibbling VBG quicken VB quieted VBD quieted VBN quieting VBG quiet VB quipped VBD quips NNS quips VBZ Quips VBZ quirks NNS quits VBZ quitting VBG quit VB quit VBD quit VBN quit VBP quivers NNS quiz VB quota-cheaters NNS quotas NNS quotations NNS quoted VBD quoted VBN quotes NNS quotes VBZ quote VB quote VBP quoting VBG Quoting VBG raced VBD racehorses NNS races NNS racetracks NNS racing VBG Racing VBG racked VBD racked VBN racketeering VBG rackets NNS racking VBG racks NNS radar-eluding VBG radicals NNS radioing VBG radios NNS rafters NNS raged VBD raged VBN rages NNS rage VB raging VBG raided VBD raided VBN raiders NNS raiding VBG raids NNS raid VB railbikes NNS railcars NNS railings NNS railroads NNS rails NNS rails VBZ railways NNS rained VBD rains NNS rain VB raised VBD raised VBN raisers NNS raises NNS raises VBZ raise VB Raise VB raise VBP raising VBG Raising VBG raked VBD raking VBG rallied VBD RALLIED VBD rallied VBN rallies NNS rallies VBZ rallying VBG rally VB Rally VB rally VBP rambled VBD ramifications NNS rammed VBD ramparts NNS ramps NNS ramp VB ranchers NNS ranches NNS rand NNS ranged VBD ranged VBN rangers NNS ranges NNS ranges VBZ range VB 
range VBP ranging VBG rang VBD ranked VBD ranked VBN rankings NNS ranking VBG rankled VBN ranks NNS ranks VBZ rank VB rank VBP ran VBD raped VBD raped VBN rapeseeds NNS raping VBG rapists NNS raptors NNS rarefied VBN ratcheting VBG rated VBD rated VBN Rated VBN ratepayers NNS rates NNS Rates NNS RATES NNS rates VBZ rate VB rate VBP ratified VBD ratified VBN ratifying VBG ratify VB ratings NNS Ratings NNS rating VBG rationalizations NNS rationalize VB rationalizing VBG rationed VBN ratios NNS RATIOS NNS rats NNS rattled VBD RATTLED VBD rattled VBN rattle VB rattling VBG rat VB ravaged VBN ravages NNS RAVAGES NNS raves VBZ rave VB ravines NNS raw-materials NNS rays NNS razed VBN razing VBG reached VBD reached VBN Reached VBN reaches NNS reaches VBZ reaching VBG Reaching VBG reach VB reach VBP reacted VBD reacted VBN reacting VBG reactions NNS reactivated VBD reactivated VBN reactors NNS reacts VBZ react VB react VBP readers NNS Readers NNS readied VBD readings NNS reading VBG Reading VBG readmit VB reads VBZ read VB Read VB read VBD read VBD|VBP read VBN read VBP read VBP|VBD reaffirmed VBD reaffirming VBG reaffirms VBZ reaffirm VB Reaganauts NNS realestate VB realigned VBD realigning VBG realignments NNS realign VB realists NNS realities NNS realized VBD realized VBN realizes VBZ realize VB realize VBP realizing VBG reallocated VBN reallocate VB realms NNS reams NNS reaped VBD reaped VBN reaping VBG reappointed VBN reapportion VBP reappraised VBD reappraised VBN reappraise VB reap VB REAP VBP Rearding VBG reared VBN rearing VBG rearm VB rearranges VBZ rearrange VB reasoned VBD reasoned VBN reasons NNS Reasons NNS reasons VBZ reason VB reason VBP reasserting VBG reasserts VBZ reassert VB reassessing VBG reassess VB reassigned VBD reassigned VBN reassignments NNS reassume VB reassurances NNS reassured VBD reassured VBN reassure VB reassuring VBG reauthorize VB reawakening VBG rebates NNS rebelled VBD rebels NNS rebounded VB rebounded VBD rebounded VBN rebounding VBG Rebounding VBG rebounds NNS rebounds VBZ rebound VB rebuffed VBD rebuffed VBN rebuilding VBG Rebuilding VBG rebuild VB rebuilt VBN rebuked VBD rebuts VBZ rebutted VBN rebut VB recalculated VBD recalculating VBG recalculations NNS recalled VBD recalled VBN recalling VBG recalls NNS recalls VBZ Recalls VBZ recall VB Recall VB recall VBP recanted VBD recanted VBN recapitalizations NNS recapitalized VBN recapture VB recede VBP receding VBG receipts NNS receivables NNS received VBD received VBN receivers NNS receives VBZ receive VB receive VBP receiving VBG recentralized VBN receptionists NNS receptors NNS recessed VBN recessions NNS recharging VBG recipes NNS recipients NNS recites VBZ reciting VBG reckoned VBN reckoning VBG reckons VBZ reckon VB reckon VBP reclaimed VBN reclaiming VBG reclaims VBZ reclaim VB reclaim VBP reclassified VBD reclining VBG recognized VBD recognized VBN recognizes VBZ recognize VB recognize VBP recognizing VBG recommendations NNS recommendatons NNS recommended VBD recommended VBN recommending VBG recommends VBZ recommend VB recommend VBP reconciles VBZ reconcile VB reconciling VBG reconnect VB reconsidered VBN reconsider VB reconstructed VBD reconstructed VBN reconstructing VBG reconstruct VB recorded VBD recorded VBN recorders NNS recordings NNS recording VBG records NNS RECORDS NNS records VBZ record VB Record VB recounted VBD recounted VBN recounting VBG recounts VBZ recouped VBD recouped VBN recoup VB recovered VBD recovered VBN recoveries NNS recovering VBG Recovering VBG recovers VBZ recover VB 
recover VBP recraft VB re-creactions NNS recreate VB Re-creating VBG re-creations NNS recruited VBD recruited VBN Recruited VBN recruiting VBG recruits NNS recruits VBZ recruit VB rectangles NNS rectified VBN rectifying VBG recuperate VB recurring VBG recused VBN recycled VBN recycles VBZ recycle VB recycling VBG reddened VB redeemed VBN redeeming VBG redeem VB redefined VBD redefine VB redefining VBG redemptions NNS redeploy VB redesigned VBD redesigned VBN redesigning VBG redesign VB redevelop VB red-flag VB redial VB redirected VBN rediscover VB redistribute VB redistributing VBG redlining VBG redoing VBG redoubling VBG redound VB redo VB redraw VB redress VB reds NNS Reds NNS reduced VBD reduced VBN reduces VBZ reduce VB reduce VBP reducing VBG Reducing VBG reductions NNS reefs NNS re-elected VBD re-elected VBN reeled VBD reeled VBN reeling VBG re-emerge VB re-emphasize VBP re-enacting VBG re-enactments NNS Re-enactments NNS re-entered VBD re-entering VBG re-enter VB re-establishing VBG re-establish VB reestablish VB re-evaluate VB re-evaluate VBP re-evaluating VBG re-examine VB reexamining VBG re-exports NNS refashioning VBG referees NNS references NNS referrals NNS referred VBD referred VBN referring VBG Referring VBG refers VBZ refer VB refer VBP refile VB refinanced VBD refinanced VBN refinance VB refinancing VBG refined VBN refineries NNS refiners NNS Refiners NNS refine VB refining VBG refitting VBG reflected VBD reflected VBN reflecting VBG Reflecting VBG reflects VBZ reflect VB reflect VBP refocused VBD refocused VBN refocuses VB refocusing VBG refocus VB reformed VBN reformers NNS reforming VBG reforms NNS reformulated VBN reform VB refrained VBN refrain VB refreshing VBG refrigerators NNS refueling VBG refugees NNS refunded VBN refunding VBG refunding VBG|NN refunds NNS refund VB refurbished VBN refurbishing VBG refurbish VB refused VBD refused VBN refusers NNS refuses VBZ refuse VB refuse VBP refusing VBG refuted VBD refute VB regained VBD regained VBN regaining VBG regains VBZ Regains VBZ regain VB regain VBP regarded VBD regarded VBN Regarded VBN regarding VBG Regarding VBG regards VBZ regard VB regard VBP regenerate VB regions NNS registered VBD registered VBN registering VBG registers NNS register VB register VBP registrants NNS registrations NNS regrets NNS regrets VBZ regretted VBD regretted VBN regret VB regret VBP regroup VB regroup VBP regulated VBN regulates VBZ regulate VB regulating VBG regulations NNS REGULATIONS NNS regulators NNS Regulators NNS regulators VBZ regummed VBD rehabilitated VBN rehabilitate VB rehashing VBG reigned VBD reigning VBG reignited VBD reignited VBN reignite VB reigniting VBG reimbursed VBD reimbursed VBN reimbursements NNS reimburses VBZ reimburse VB reimburse VBP reimpose VB reincorporated VBN reincorporating VBG reindicting VBG reinforced VBD reinforced VBN reinforcements NNS reinforces VBZ reinforce VB reinforce VBP reinforcing VBG Reinforcing VBG reining VBG reins NNS reinstalled VBN reinstated VBD reinstated VBN reinstate VB reinstating VBG reinstituting VBG reinsurers NNS reintegrated VBN reintroduced VBN rein VB reinvented VBD reinvent VB reinvested VBD reinvested VBN reinvesting VBG reinvest VB reinvest VBP reinvigorated VBN reinvigorate VB reinvigorating VBG reiterated VBD reiterates VBZ reiterating VBG REITs NNS rejected VBD rejected VBN rejecting VBG rejections NNS rejects VBZ reject VB reject VBP rejoice VBP rejoined VBD rejoining VBG Rejoins VBZ rejoin VB rejuvenate VB rekindled VBN Rekindled VBN rekindle VB rekindling VBG 
relabeling VBG related VBD related VBN Related VBN relates VBZ relate VB relate VBP relating VBG relationships NNS relations NNS Relations NNS relatives NNS relaunched VBN relaunch VB relaxed VBD relaxed VBN relaxing VBG relax VB relax VBP relayed VBD released VBD released VBN releases NNS releases VBZ release VB Release VB release VBP releasing VBG relegated VBN relented VBD relenting VBG relent VBP relics NNS relied VB relied VBD relied VBN relies VBZ relieved VBD relieved VBN relieve VB religions NNS relinquished VBD relinquished VBN relinquishing VBG relinquish VB relished VBD relishes VBZ relish VB relive VBP relocated VBD relocated VBN relocate VB relocating VBG relocations NNS relying VBG Relying VBG rely VB rely VBP remade VB remained VBD remained VBN remaining VBG Remaining VBG remains NNS Remains NNS remains VBZ remain VB remain VBP remake VB remanded VBD remarked VBD remarked VBN Remarketers NNS remarketings NNS remarks NNS remarks VBZ remark VB remedied VBN remedies NNS remedy VB remembered VBD remembered VBN remembering VBG remembers VBZ remember VB Remember VB remember VBP Remics NNS REMICs NNS reminded VBD reminded VBN reminders NNS reminding VBG reminds VBZ remind VB remind VBP remittances NNS remnants NNS remodeled VBN remodeling VBG remora NNS removed VBD removed VBN Removed VBN removes VBZ remove VB removing VBG remunerated VBN renamed VBD renamed VBN rename VB rendered VBD rendered VBN renderings NNS rendering VBG render VB rendezvoused VBD renege VB reneging VBG renegotiated VBN renegotiate VB renegotiating VBG renewals NNS renewed VBD renewed VBN Renewed VBN renewing VBG renews VBZ renew VB renounced VBD renounce VB renouncing VBG renovated VBN renovate VB renovating VBG renowned VBN rentals NNS rented VBN renters NNS renting VBG rents NNS Rents NNS rents VBZ rent VB reoffered VBN reopened VBD reopened VBN reopening VBG reopens VBZ reopen VB reorganized VBN reorganizes VBZ reorganize VB reoriented VBN repackaged VBN repackage VB repackaging VBG repaid VBD repaid VBN repainted VBN repaired VBD repaired VBN repairing VBG repairs NNS repairs VBZ repair VB repair VBP reparations NNS repassed VBN repatriate VB repaying VBG repayments NNS repay VB repealed VBN repeals VBZ repeal VB repeated VBD repeated VBN repeaters NNS repeating VBG repeats NNS repeats VBZ repeat VB repel VB repel VBP repercussions NNS replaced VBD replaced VBN replacements NNS replaces VBZ replace VB replace VBP replacing VBG Replacing VBG replaster VB replays NNS replenished VBN replenish VB replicated VBN replicate VB replicating VBG replied VBD Replied VBD replied VBN replies NNS replies VBZ reply VB repond VB reported VBD reported VBN reporters NNS reporting VBG reports NNS Reports NNS REPORTS NNS reports VBZ Reports VBZ report VB Report VB report VBP reposed VBN reposition VB repositories NNS repossess VB representations NNS representatives NNS Representatives NNS represented VBD represented VBN representing VBG representives NNS represents VBZ represent VB represent VBP repressed VBN repressing VBG repriced VBN reprinted VBN Reprinted VBN reprints VBZ reprint VB reprisals NNS reproduced VBD Reproduced VBN reproduce VB reprove VB reps NNS Republicans NNS republics NNS repudiate VB repurchased VBD repurchased VBN repurchases NNS repurchase VB repurchase VBD repurchase VBN repurchasing VBG reputations NNS reputed VBN requested VBD requested VBN requesting VBG requests NNS request VB request VBP required VBD required VBN requirements NNS requires VBZ require VB Require VB require VBP requiring VBG 
requisitioned VBD rerouted VBN rerouting VBG reruns NNS resales NNS rescheduled VBD rescheduled VBN reschedule VB rescinded VBD rescinding VBG rescind VB rescissions NNS rescued VBD rescuers NNS rescues VBZ rescue VB researched VBN researchers NNS Researchers NNS RESEARCHERS NNS researches VBZ researching VBG research VB resellers NNS reselling VBG resells VBZ resell VB resell VBP resemblances NNS resembles VBZ resemble VB resemble VBP resembling VBG resented VBD resent VB resent VBP reservations NNS reserved VBD reserved VBN Reserved VBN reserves NNS Reserves NNS reserves VBZ reserve VB reserve VBP reserving VBG reservoirs NNS reset VB reshaped VBD reshaped VBN reshape VB reshaping VBG reshuffled VBD reshuffle VB reshufflings NNS reshuffling VBG resided VBN residences NNS residents NNS Residents NNS resides VBZ reside VB residing VBG residues NNS resignations NNS RESIGNATIONS NNS resigned VBD RESIGNED VBD resigned VBN resigning VBG resign VB resins NNS resisted VBD resisted VBN resisting VBG resists VBZ resist VB Resist VB resist VBP resold VB resold VBN resold VBP resolutions NNS resolved VBD resolved VBN resolve VB resolving VBG resonated VBD resonates VBZ resonate VB resorts NNS resorts VBZ resort VB resort VBP resources NNS respected VBD respected VBN respects NNS respects VBZ respect VB responded VBD responded VBN respondents NNS responding VBG Responding VBG responds VBZ respond VB respond VBP responses NNS Responses NNS responsibilities NNS restarted VBD restarted VBN restarters NNS restarting VBG restart VB restated VBD restated VBN restate VB restating VBG restaurants NNS Restaurants NNS rested VBD restored VBD restored VBN restore VB restoring VBG restrained VBD restrained VBN restraining VBG restraints NNS restrain VB restricted VBD restricted VBN restricting VBG restrictions NNS restricts VBZ restrict VB Restrict VB restrict VBP restructured VBD restructured VBN restructures VBZ restructure VB restructure VBP restructurings NNS restructuring VBG rests VBZ rest VB Rest VB rest VB|NN rest VBP restyled VBN resubmit VB resulted VBD resulted VBN resulting VBG resulting VBG|JJ results NNS Results NNS results VBZ result VB result VBP resumed VBD resumed VBN resumes NNS resumes VBZ resume VB resume VBP resuming VBG re-supplied VBN resurfaced VBD resurfaced VBN resurging VBG resurrected VBD resurrected VBN resurrects VBZ resurrect VB resurrect VBP resuscitate VB resuscitating VBG retailers NNS Retailers NNS retailing VBG retail-sales NNS retails VBZ retail VB retail VBP retained VBD retained VBN retaining VBG retains VBZ retain VB retain VBP retaking VBG retaliating VBG retardants NNS retard VB rethinking VBG rethink VB retired VBD retired VBN Retired VBN retirees NNS retirements NNS retires VBZ retire VB retire VBP retiring VBG retooling VBG retools VBZ retorts NNS retorts VBZ retraced VBD retracted VBD retraining VBG retreated VBD retreated VBN retreating VBG retreats NNS retreat VB retrench VBP retrieved VBD retrieved VBN retrieve VB retrieve VBP retrofit VB retry VB returned VBD returned VBN returning VBG returns NNS Returns NNS returns VBZ return VB return VBP reunions NNS reunited VBN reunite VB reused VBN revalued VBN revamped VBD revamped VBN revamping VBG revamp VB 're VBP revealed VBD revealed VBN revealing VBG reveals VBZ Reveals VBZ reveal VB reveal VBP revelations NNS revelers NNS reveling VBG revels NNS revel VBP revenues NNS Revenues NNS reverberated VBN reverberate VB reverberating VBG reverberations NNS reversals NNS reversed VBD reversed VBN reverses VBZ reverse VB 
Reverse VBP reversing VBG Reversing VBG reverted VBN reverts VBZ reviewed VBD reviewed VBN reviewing VBG Reviewing VBG reviews NNS reviews VBZ review VB review VBP revised VBD revised VBN Revised VBN REVISED VBN revise VB revising VBG Revising VBG revisionists NNS revisions NNS revisited VBN revisits VBZ revisit VB Revitalized VBN revitalizing VBG revivals NNS Revivals NNS revived VBD revived VBN revive VB revive VBP reviving VBG revoked VBN revoke VB revoking VBG revolutionaries NNS revolutionized VBD revolutionize VB revolves VBZ revolve VB revolving VBG revved VBN rewarded VBN rewarding VBG rewards NNS Rewards NNS rewards VBZ reward VB Reward VB reworked VBN rewrite VB rewriting VBG rewritten VBN rhymed VBD rhymes VBZ rhyming VBG ribbies NNS ribbons NNS ribs NNS Ricans NNS riches NNS riders NNS rides NNS ride VB ride VBP ridges NNS ridiculed VBN ridicules VBZ riding VBG rid VB RID VB rid VBD rid VBN rid VBN|JJ riffing VBG rifles NNS rigged VBD rigged VBN righted VBN rights NNS Rights NNS RIGHTS NNS right-to-lifers NNS right-wingers NNS rigors NNS rigs NNS riles VBZ rile VBP rim VBP ringers NNS Ringers NNS ringing VBG rings NNS rings VBZ ring VB ring VBP riots NNS ripens VBZ ripen VBP ripoffs NNS ripped VBD ripped VBN Ripples NNS ripple VBP rippling VBG risen VBN rises NNS rises VBZ rise VB rise VBP rising VBG Rising VBG risked VBD risking VBG risks NNS Risks NNS risks VBZ risk VB risk VBP rites NNS rituals NNS rivaling VBG rivalries NNS rivals NNS Rivals NNS rivals VBZ rival VB rivers NNS riveted VBD riveted VBN rivets NNS rivets VBZ roadblocks NNS roads NNS Roads NNS roadways NNS roamed VBD roam VBP roaring VBG roars VBZ robbed VBN robberies NNS robbers NNS Robbers NNS robbing VBG robes NNS robots NNS rocked VBD rocked VBN rockers NNS rocketed VBD rocketing VBG rockets NNS rocking VBG rocks NNS rock VB rodents NNS rode VBD RODE VBD rods NNS rogues NNS roiling VBG roil VB roles NNS rollbacks NNS rolled VBD rolled VBN Rolled VBN rollers NNS rolling VBG rollovers NNS rolls NNS rolls VBZ roll VB roll VBP romancing VBG romanticized VBN romps NNS romp VBP roofers NNS roofs NNS rooftops NNS Roommates NNS rooms NNS roost VB rooted VBN rooters NNS rooting VBG roots NNS root VB root VBP ropes NNS rosarians NNS roses NNS rose VBD rose VBP rotated VBD rotate VB rotating VBG rotted VBN rotting VBG roughed VBD roughnecks NNS rounded VBD rounded VBN rounds NNS round VB round VBP roustabouts NNS routed VBN routes NNS routes VBZ routines NNS routing VBG rowed VBD rows NNS row VB royalties NNS rubbed VBD rubber-necking VBG rubber-stamp VB rubdowns NNS rubfests NNS Rubins NNS rubles NNS rubs NNS rubs VBZ rub VB rub VBP ruffled VBN Ruffled VBN rugs NNS ruined VBN Ruined VBN ruining VBG ruins NNS ruin VB ruin VBP ruled VBD ruled VBN rulers NNS rules NNS Rules NNS RULES NNS rules VBZ rule VB rule VBP rulings NNS ruling VBG rumbled VBD rumbles VBZ rumble VBP rumblings NNS rumbling VBG ruminated VBD ruminated VBN ruminations NNS rumored VBD rumored VBN rumors NNS Rumors NNS rumors VBZ rung VBN run-ins NNS runners NNS runners-up NNS running VBG Running VBG runs NNS runs VBZ runups NNS run VB run VBD run VBN run VBP Runways NNS ruptured VBD ruptured VBN rupturing VBG rushed VBD rushed VBN rushes VBZ rushing VBG rush VB rush VBP rusted VBN rusticated VBN rustlers NNS rustlings NNS RVs NNS Saatchi NNS sabers NNS sabotage VB sacked VBD sackings NNS sacking VBG sacks NNS sacrifices NNS sacrifices VBZ sacrifice VB sacrificing VBG saddled VBD saddled VBN safeguarded VBN safeguarding VBG safeguards NNS safeguard VB 
safety VB sages NNS sagged VBD sagged VBN sagging VBG sagging VBG|JJ Sagos NNS said VBD Said VBD SAID VBD said VBN Said VBN sailed VBD sailing VBG sailors NNS sails NNS saints NNS salaries NNS SALARIES NNS salarymen NNS salesmen NNS sales NNS Sales NNS SALES NNS salespeople NNS Salespeople NNS salicylates NNS salted VBD saluted VBD saluting VBG salvaged VBN salvage VB salve VB Samaritans NNS samovars NNS sampled VBN samples NNS sanctioned VBN sanctioning VBG sanctions NNS sanctions VBZ Sandinistas NNS sands NNS sandwiched VBD sandwiched VBN Sandwiched VBN sandwiches NNS sang VBD sanitationists NNS sanitized VBN sanitize VBP sank VBD San NNS sapped VBN sapping VBG sap VB satellites NNS satisfied VBD satisfied VBN satisfied VBN|JJ satisfies NNS satisfies VBZ satisfying VBG Satisfying VBG satisfy VB saturated VBD saturated VBN saturate VB sat VBD sat VBN saucers NNS sauces NNS saunas NNS saved VBD saved VBN savers\/investors NNS savers NNS saves VBZ save VB Save VB save VBP savings NNS Savings NNS saving VBG savored VBD savoring VBG savors NNS savor VB saw VBD saying VBG Saying VBG says VBZ Says VBZ say VB Say VB say VBP Say VBP scabs NNS scalawags NNS scaled VBD scaled VBN scales NNS scale VB scaling VBG scalps NNS scammed VBD scammers NNS scamper VBP scams NNS scandalized VBD scandals NNS scanners NNS scanning VBG scans NNS scans VBZ scan VB scape VB scared VBD scared VBN scares NNS scares VBZ scare VB scare VBP scarfing VBG scaring VBG Scaring VBG scarred VBN scars NNS scattered VBN scavengers NNS scenarios NNS Scenarios NNS scenes NNS scents NNS scheduled VBD scheduled VBN schedules NNS schedule VB scheduling VBG schemers NNS schemes NNS scheming VBG schmumpered VBD scholarships NNS scholars NNS schoolboys NNS schoolchildren NNS schoolmates NNS schools NNS Schools NNS schoolteachers NNS school VB sciences NNS scientists NNS Scientists NNS SciMed VBD SciMed VBN scoffed VBD scoffs VBZ scoff VBP scolded VBN scold VB scooped VBD scooping VBG scoops NNS scoops VBZ scoop VB scooted VBD scored VBD scored VBN scores NNS Scores NNS score VBP scoring VBG scorn VB scorn VBP scotched VBD scotches NNS scourges NNS scouring VBG scour VB scouting VBG scout VB scowls VBZ scowl VBP scrambled VBD scrambled VBN scrambles NNS scramble VBP scrambling VBG scrape VB scrapped VBD scrapped VBN scrapping VBG scraps NNS Scraps NNS scraps VBZ scrap VB SCRAP VBP scratched VBN scratching VBG scratch VB scratch VBP screamed VBD screaming VBG screams VBZ scream VB scream VBP screeched VBD screeching VBG screened VBD screenings NNS screening VBG screens NNS screens VBZ screen VB screenwriters NNS screwed VBD screwed VBN screws NNS scribbled VBD scribblers NNS scribbling VBG scribes NNS scrimped VBD scrimping VBG scripts NNS scriptwriters NNS scrounged VBD scrounge VBP scrubbers NNS scrutinized VBD scrutinized VBN scrutinize VB scrutinizing VBG sculptors NNS sculptures NNS scurries NNS scurrying VBG scurry VB scuttled VBD scuttled VBN scuttle VB sealants NNS sealed VBD sealed VBN sealing VBG seals NNS seal VB seamen NNS searched VBD searches NNS searches VBZ searching VBG search VB search VBP searing VBG Sears NNS seas NNS seasonings NNS seasons NNS seated VBN seating VBG seats NNS Seats NNS seats VBZ secede VB second-guessed VBN second-guess VB seconds NNS Seconds NNS secretaries NNS secrets NNS sections NNS sectors NNS secured VBD secured VBN secure VB secure VBP securing VBG securites NNS securities NNS Securities NNS sedans NNS seduce VB seducing VBG seeded VBN seeds NNS seeing VBG Seeing VBG seekers NNS seeking VBG 
Seeking VBG SEEKING VBG seeks VBZ seek VB seek VBP Seek VBP seemed VBD seemed VBN seems VBZ Seems VBZ seem VB seem VBP seen VBN Seen VBN seeped VBD seesawing VBG sees VBZ Sees VBZ seething VBG see VB See VB see VBP SEE VBP segmenting VBG segments NNS segregated VBD segregate VB seized VBD seized VBN Seizes VBZ seize VB seize VBP seizing VBG seizures NNS selected VBD selected VBN selecting VBG selections NNS Selections NNS selects VBZ select VB select VBP self-destructed VBD self-insure VBP self-reinsure VB self-starters NNS sellers NNS selling VBG Selling VBG sell-off NNS sell-offs NNS selloffs NNS sells VBZ sell VB Sell VB SELL VB sell VBP semantics NNS semesters NNS semi-celebrities NNS semiconductors NNS semifinished VBN Semifinished VBN seminars NNS senators NNS Senators NNS senders NNS sending VBG sends VBZ send VB Send VB send VBP seniors NNS Seniors NNS sensed VBD senses NNS sense VB sense VBP sensibilities NNS sensing VBG sensitives NNS sensitivities NNS sensitize VB Sens. NNS sensors NNS sentenced VBD sentenced VBN sentences NNS Sentences NNS sentencings NNS sentencing VBG Sentencing VBG sentiments NNS sent VBD sent VBN separated VBN SEPARATED VBN separate VB separate VBP separating VBG sequels NNS sequestered VBN sequester VB sequester VBP sequins NNS sergeants NNS serials NNS series NNS Series NNS servants NNS served VBD served VBN Served VBN servers NNS serves VBZ serve VB serve VBP serviced VBN services NNS SERVICES NNS services VBZ service VB servicing VBG serving VBG sessions NNS setbacks NNS sets NNS sets VBZ setters NNS settings NNS setting VBG Setting VBG settled VBD settled VBN settlements NNS Settlements NNS settlers NNS settles VBZ settle VB Settle VB settle VBP settling VBG set VB set VBD set VBN set VBP severed VBD severed VBN severing VBG sever VB sevices NNS sewers NNS sew VB sexes NNS shacks NNS shades NNS shadowing VBG shadows NNS shadow VB shags VBZ shaken VBN Shaken VBN shakes VBZ shake VB SHAKE VB shake VBP shaking VBG shaped VBN shapes NNS shapes VBZ shape VB shape VBP shaping VBG shards NNS sharecroppers NNS shared VBD shared VBN shareholders NNS Shareholders NNS shareholdings NNS shares NNS Shares NNS shares VBZ share VB share VBP sharing VBG Sharing VBG sharks NNS sharpening VBG sharpens VBZ sharpen VB shattered VBD shattered VBN shattering VBG shatters NNS shaved VBD shaved VBN shaves VBZ shave VB Shaving VBG sheared VBN sheaths NNS shedding VBG SHEDDING VBG shed VB shed VBD shed VBN shed VBP sheets NNS sheiks NNS shelled VBD shelling VBG shells NNS shell VB sheltered VBN sheltering VBG shelters NNS SHELTERS NNS shelved VBD shelves NNS shepherded VBD sheriffs NNS shied VBD shied VBN shielded VBD shielded VBN shielding VBG shields NNS shield VB shifted VBD shifted VBN shifting VBG shifts NNS shifts VBZ shift VB shift VBP shillings NNS shills NNS shimmered VBD shine VB shine VBP shining VBG Shining VBG shins NNS shipbuilders NNS shipments NNS Shipments NNS shipped VBD shipped VBN shippers NNS Shippers NNS shipping VBG shipsets NNS ships NNS ship VB ship VBP shipyards NNS shirking VBG shirk VB shirts NNS shivering VBG shivers NNS shocked VBD shocked VBN Shocked VBN shocks NNS shock VB shoehorned VBN shoe-horn VB shoelaces NNS shoemaking VBG shoes NNS shook VBD Shook VBD shootings NNS shooting VBG shoots NNS shoots VBZ shoot VB shoot VBP shopkeepers NNS shopped VBD shopped VBN shoppers NNS Shoppers NNS SHOPPERS NNS shopping VBG shops NNS Shops NNS SHOPS NNS shop VB shores NNS shore VB shoring VBG shorn VB Shorn VBN shortages NNS shortchanged VBN 
short-circuited VBN shortcomings NNS shorted VBN shortened VBN shortening VBG shorten VB shorting VBG Shorting VBG short-sellers NNS shorts NNS short VB shots NNS shot VBD shot VBN shouldering VBG shoulders NNS shoulder VB shoulder VBP shouted VBD shouting VBG shouts VBZ shout VB shout VBP shoved VBD shovels NNS shoves VBZ shove VB shoving VBG showcases NNS showed VBD showed VBN showers NNS shower VB showgirls NNS showings NNS showing VBG Showing VBG shown VBN showrooms NNS Showrooms NNS shows NNS show-stoppers NNS shows VBZ Shows VBZ show VB Show VB show VBP shrank VBD shredded VBD shrieked VBD shrines NNS shrinking VBG Shrinking VBG shrinks VBZ shrink VB shriveled VBD shrouded VBD shrubs NNS Shrubs NNS shrugged VBD shrugs NNS shrugs VBZ shrug VB shrunk VBN shudders NNS shuffled VBD shuffling VBG shunned VBD shunning VBG shun VB shun VBP SHUN VBP shutdowns NNS shuts NNS shuts VBZ shuttered VBD shuttering VBG shutting VBG shuttled VBD shuttled VBN shuttles NNS shuttling VBG shut VB shut VBD shut VBN shying VBG shy VB shy VBP siblings NNS sided VBD sided VBN sidelined VBN sidelines NNS sidelining VBG sides NNS SIDES NNS sidestepped VBD sidestepping VBG sidesteps VBZ sidestep VB sidestep VBP sidetrack VB side VB side VBP sidewalks NNS sifted VBN sift VB sift VBP sighed VBD sighing VBG sighs NNS sighs VBZ sightings NNS sights NNS signaled VBD signaled VBN SIGNALED VBN signaling VBG signalling VBG signals NNS signals VBZ signal VB SIGNAL VB signal VBP signatories NNS signatures NNS signboards NNS signed VBD signed VBN Signed VBN signified VBD signifying VBG signify VB signing VBG signs NNS Signs NNS signs VBZ sign VB silenced VBN silences NNS Silences NNS silence VB silted VBN similarities NNS simmering VBG simmer VB simplicities NNS simplified VBN simplifying VBG SIMPLIFYING VBG simplify VB simplify VBP simulates VBZ simulate VBP simulations NNS simulators NNS singers NNS singing VBG Singin VBG singled VBD singled VBN singles NNS single VB single VBP singling VBG sings VBZ sing VB sing VBP sinking VBG sink VB sink VBP sins NNS siphoned VBD siphoned VBN siphoning VBG siphon VB sipped VBD sipping VBG sirens NNS sisters NNS sitcoms NNS sites NNS sits VBZ sitting VBG Sitting VBG sitting VBG|JJ situated VBN situations NNS sit VB Sit VB sit VBP six-packs NNS sixties NNS Sixties NNS sized VBD sizes NNS size VBP sizzle VB sizzling VBG skateboards NNS skeptics NNS Skeptics NNS sketches NNS sketches VBZ sketching VBG skewed VBN skidded VBD SKIDDED VBD skidded VBN skidding VBG skids NNS skid VB skid VBD skiers NNS skies NNS skiing VBG skills NNS Skills NNS skimmers NNS skimp VB skim VB skins NNS skipped VBD skipper VB skipping VBG Skipping VBG skip VB skip VBP skirmished VBN skirmishes NNS skirted VBN skirting VBG skirts VBZ skis NNS ski VB SKr1.5 NNS SKr205 NNS SKr20 NNS SKr225 NNS SKr29 NNS Skulls NNS skyrocketed VBD skyrocketed VBN skyrocketing VBG slabs NNS slackened VBD slackened VBN slackening VBG slacks NNS slack VB slain VBN slam-dunk VB slammed VBD slam VBP slapped VBD slapped VBN slaps NNS slaps VBZ slap VB slashed VBD slashed VBN slashes NNS slashing VBG slash VB slash VBP slated VBD slated VBN Slated VBN slats NNS slaughtered VBN slayings NNS Slay VBP sleeping VBG Sleeping VBG sleeps VBZ sleep VB sleep VBP Sleep VBP sleeves NNS slept VBD slice VB slice VBP slicing VBG slide-packs NNS slides NNS Slides NNS slides VBZ slide VB sliding VBG slid VBD slid VBN slimmed VBN slimming VBG slingers NNS slings NNS slipped VBD slipped VBN slipping VBG slips VBZ slip VB slip VBP slithered VBD slithering 
VBG slits NNS slivered VBN slogans NNS slogs VBZ slog VB slopes NNS slopes VBZ sloshing VBG slots NNS slough VB slowdowns NNS slowed VBD slowed VBN slowing VBG Slowing VBG slows VBZ slow VB S&Ls NNS slumped VBD slumped VBN slumping VBG slumps NNS slump VB slump VBP slums NNS slurs NNS smacks VBZ smack VBP smarting VBG smashed VBD smashed VBN smashing VBG smash VB smelled VBD smelling VBG smells VBZ smell VBP smelt VBN smidgins NNS smiled VBD smiles NNS smiles VBZ smile VBP smiling VBG Smiling VBG smoked VBD smokers NNS Smokers NNS smokescreens NNS smokes VBZ smoke VB smoke VBP smoking VBG smoldering VBG smolder VBP smoothed VBN smooth VB smothered VBN smothering VBG smother VB smuggle VB snafus NNS snagged VBN snags NNS snakes NNS snakes VBZ snaking VBG snapped VBD snapped VBN snapping VBG snapshots NNS snaps VBZ snap VBP snare VB snarls NNS snatched VBD snatched VBN snatch VB sneaked VBD sneakers NNS sneaking VBG sneak VBP sniffed VBD sniffing VBG sniffs VBZ sniff VB sniped VBD snippets NNS sniveling VBG 's NNS snooping VBG Snoozing VBG snoring VBG snorts VBZ snowballed VBD snowball VB snowbirds NNS snubbed VBD snubbing VBG soaking VBG soak VB soaps NNS soapsuds NNS soared VBD soared VBN soaring VBG Soaring VBG soars NNS soar VB soar VBP sobered VBD sob VB socalled VBN social-affairs NNS socialists NNS Socialists NNS socialize VB socializing VBG societies NNS sociologists NNS socks NNS sock VB Sock VB sodas NNS sofas NNS soft-drinks NNS softened VBD softened VBN softening VBG softens VBZ soften VB softies NNS soiled VBD soil-nutrients NNS soils NNS soirees NNS soldiers NNS Soldiers NNS sold VBD sold VBN solicitations NNS solicited VBD solicited VBN soliciting VBG solicitors NNS solicits VBZ solicit VB solidified VBD solidify VB solidify VBP solutions NNS solved VBD Solved VBD solved VBN solvents NNS solves VBZ solve VB solving VBG Solving VBG songs NNS SONGsters NNS songwriters NNS sons NNS soothe VB soothing VBG sophisticates NNS sops NNS soreheads NNS sorted VBN sorting VBG Sorting VBG sorts NNS sort VB sought VBD sought VBN soulmates NNS souls NNS sounded VBD sounded VBN soundings NNS sounding VBG sounds NNS sounds VBZ Sounds VBZ sound VB Sound VB sound VBP soups NNS sources NNS Sources NNS sourcing VBG soured VBD soured VBN sour VB soviets NNS Soviets NNS sowed VBD Sows NNS sows VBZ sow VB sow VBP soybeans NNS Soybeans NNS SOYBEANS NNS spaceships NNS spaces NNS spackle VB spaghetti NNS spanned VBD spanning VBG spans NNS span VBP spared VBD spared VBN spares NNS spares VBZ spare VB spare VBP sparing VBG sparked VBD sparked VBN sparking VBG sparkplugs NNS sparks NNS sparks VBZ Sparks VBZ spark VB sparred VBD sparring VBG spasms NNS spas NNS spawned VBD spawned VBN spawns VBZ spawn VB speakers NNS Speakers NNS speaking VBG Speaking VBG speaks VBZ speak VB speak VBP spearheaded VBD spearheaded VBN spearheading VBG specialists NNS Specialists NNS specialized VBN specializes VBZ specialize VB specialize VBP specializing VBG specials NNS specialties NNS specialty-chemicals NNS specialty-metals NNS species NNS specifications NNS Specifications NNS specifics NNS specified VBD specified VBN specifies VBZ specifying VBG specify VB specimens NNS specs NNS spectators NNS speculated VBD speculated VBN speculate VB speculate VBP speculating VBG speculations NNS speculators NNS Speculators NNS sped VBD sped VBN speeches NNS speeded VBD speeding VBG speeds NNS speeds VBZ speed VB Speed VB spelled VBN spelling VBG spells NNS spells VBZ spell VB spenders NNS spending VBG Spending VBG spending VBG|NN 
spends VBZ spendthrifts NNS spend VB Spend VB spend VBP spent VBD spent VBN spewed VBD spewing VBG spices NNS spiders NNS spied VBD spies NNS spies VBZ spigots NNS spiked VBN spilled VBD spilled VBN spills NNS spills VBZ spill VB spinning VBG spinoffs NNS spins VBZ spin VB spiraled VBD spiraling VBG spiralled VBD spirited VBN spirits NNS Spirits NNS splashed VBD splints NNS splits NNS Splits NNS splits VBZ split VB split VBD split VBN spoiled VBD spoil VBP spoken VBN spokesmen NNS Spokesmen NNS spokes NNS Spokespersons NNS spoke VBD sponsored VBD sponsored VBN sponsoring VBG sponsors NNS Sponsors NNS sponsors VBZ sponsor VB sponsor VBP spooked VBD spooked VBN Spooked VBN spooks NNS spook VBP spoonbills NNS spoonfuls NNS spores NNS sported VBD sporting-goods NNS sporting VBG sportsmen NNS sports NNS Sports NNS sports VBZ spotlight VB spots NNS Spots NNS spots VBZ spotted VBD spotted VBN Spotted VBN spotting VBG spotting VBG|NN spot VB spouses NNS spout VBP sprang VBD sprawling VBG spraying VBG sprays NNS spreading VBG spreadsheets NNS spreads NNS Spreads NNS spreads VBZ spread VB spread VBD spread VBN spread VBP springing VBG springs VBZ spring VB sprinkled VBD sprinklers NNS sprinkles VBZ sprinkle VBP spritzers NNS sprouting VBG sprout VB sprout VBP spruce VB SPRUCING VBG sprung VBN spuds NNS spun VBD spun VBN spurned VBD spurned VBN spurning VBG spurns VBZ spurn VB spurn VBP spurred VBD spurred VBN Spurred VBN spurring VBG spurs VBZ spurted VBD spurted VBN spurts NNS spurts VBZ spurt VBP spur VB sputtered VBD sputter VBP spying VBG spy VB squabbles NNS squads NNS squalls NNS squandered VBN squandering VBG squared VBD squared VBN squares NNS square VB squaring VBG squatted VBN squeaking VBG squeegee VBP squeezed VBD squeezed VBN squeezes VBZ squeeze VB squeeze VBP squeezing VBG squelched VBN squelch VBP squinted VBD squinting VBG squirming VBG stabbed VBD stabbed VBN stabbing VBG stabilized VBD stabilized VBN stabilizes VBZ stabilize VB stabilize VBP stabilizing VBG Stabilizing VBG stacked VBN stacking VBG stacks NNS stack VB stadiums NNS Stadiums NNS staffed VBN staffers NNS Staffers NNS staffing VBG staffs NNS staff VB staged VBD STAGED VBD staged VBN stages NNS stages VBZ stage VB stage VBP stagewhispers VBZ staggered VBD staggering VBG staging VBG stagnated VBD stagnating VBG staid VBN stains NNS stain VB staircases NNS stairs NNS staked VBN stakes NNS stake VB stalked VBN stalking VBG stalled VBD stalled VBN Stalled VBN stalling VBG stalls NNS stalls VBZ stall VB stalwarts NNS stampeded VBN stampede VB stampings NNS stamping VBG stamps NNS stamp VB stanch VB standardize VB standards NNS standbys NNS standing VBG Standing VBG stands NNS stands VBZ stand VB Stand VB stand VBP Stand VBP stapling VBG stared VBD stares NNS stare VBP staring VBG starring VBG stars NNS stars VBZ started VBD started VBN Started VBN starters NNS starting VBG Starting VBG startled VBD starts NNS starts VBP starts VBZ start-up NNS start-ups NNS start VB start VBP star VB starved VBN starve VB Starve VB starving VBG stashed VBD stash VB stated VBD stated VBN statements NNS Statements NNS statesmen NNS states NNS States NNS STATES NNS states VBZ state VB state VBP stating VBG stationed VBN stations NNS statisticians NNS statistics NNS Statistics NNS statues NNS statutes NNS staunch VB stave VB stayed VBD stayed VBN staying VBG stays NNS stays VBZ stay VB stay VBP steadied VBD steadied VBN steaks NNS stealing VBG steals VBZ steal VB steal VBP steamed VBD steamed VBN steaming VBG steelmakers NNS Steelmakers NNS 
steels NNS steelworkers NNS steered VBD steered VBN steering VBG steers VBZ steer VB stemmed VBD stemmed VBN stemming VBG stems VBZ stem VB stem VBP stepped VBD stepped VBN stepping VBG steps NNS Steps NNS steps VBZ Steps VBZ step VB Step VB step VBP stereos NNS stereotypes NNS steriles NNS sterilized VBN sterilize VB sterilizing VBG steroids NNS stewards NNS stewed VBD stickers NNS sticking VBG sticks NNS sticks VBZ stick VB Stick VB stick VBP stifles VBZ stifle VB stifling VBG still-raging VBG stilts NNS stimulated VBN stimulate VB stimulating VBG stimulators NNS stimuli NNS stinging VBG stingrays NNS stink VBP stints NNS stipends NNS stipulated VBD stipulates VBZ stipulate VB stirred VBD stirrings NNS stirring VBG stirrups NNS stirs VBZ Stirs VBZ stir VB stir VBP stitched VBN stitches NNS stockbrokers NNS Stockbrokers NNS stockbuilding VBG stocked VBN stockholders NNS Stockholders NNS stockholdings NNS stock-index-futures NNS stock-index NNS stocking VBG stock-options NNS stockpiles NNS stockpile VB stocks NNS Stocks NNS STOCKS NNS stocks VBZ stock VB stockyards NNS stoked VBN stoke VB stoking VBG stolen VBN stole VBD stomachs NNS stomach VB stomped VBD stomping VBG stoned VBN stones NNS stonewalled VBD stood VBD stood VBN stooges NNS stools NNS stoppages NNS stopped VBD stopped VBN stopping VBG stops NNS stops VBZ stop VB Stop VB stop VBP stored VBD stored VBN storefronts NNS stores NNS Stores NNS stores VBZ store VB store VBP stories NNS storing VBG stormed VBD storming VBG storms NNS storytellers NNS stowed VBD straddling VBG strafe VB straightening VBG straighten VB strained VBN strainers NNS straining VBG strains NNS strain VB strain VBP straits NNS stranded VBN stranding VBG strands NNS strangled VBN strangles VBZ strapped VBD strapped VBN stratagems NNS strategies NNS Strategies NNS strategists NNS Strategists NNS strawberries NNS straying VBG stray VB stray VBP streaked VBD streamed VBD streaming VBG streamlined VBD streamline VB streamlining VBG streams NNS streets NNS Streetspeak VB strengthened VBD strengthened VBN strengthening VBG strengthens VBZ strengthen VB strengthen VBP strengths NNS stressed VBD stressed VBN stresses NNS stresses VBZ stressing VBG stressors NNS stress VB stress VBP stretched VBD stretched VBN stretches NNS stretches VBZ stretching VBG Stretching VBG stretch VB stretch VBP strewn VBN stricken VBN strides NNS strikers NNS strikes NNS Strikes NNS strikes VBZ strike VB strike VBP striking VBG Striking VBG strings NNS string VB stripes NNS stripped VBD stripped VBN stripping VBG strips NNS Strips NNS strips VBZ strip VB striven VBN strives VBZ strive VBP striving VBG strode VBD strokes NNS Strokes NNS strokes VBZ Stroking VBG strolling VBG stroll VB stroll VBP strongholds NNS strove VBD struck VBD STRUCK VBD struck VBN structured VBD structured VBN structures NNS structure VB structuring VBG struggled VBD STRUGGLED VBD struggled VBN struggles NNS struggles VBZ struggle VB struggling VBG STUBBED VBN stuck VBD stuck VBN studded VBN student-athletes NNS studentled VBN students NNS Students NNS STUDENTS NNS studied VBD studied VBN studies NNS Studies NNS studies VBZ studios NNS Studios NNS studying VBG study VB study VBP stuffed VBD stuffed VBN Stuffing VBG stuff VBP stumbled VBD stumbled VBN stumble VB stumble VBP stumbling VBG stung VBN Stung VBN stunned VBD stunned VBN Stunned VBN stunted VBN styled VBN styles NNS styling VBG stymied VBN subcommittees NNS subcompacts NNS subconferences NNS subcontractors NNS Subcontractors NNS subcontract VB subdued VBN 
subgroups NNS subjected VBN subjecting VBG subjects NNS subjects VBZ subject VB sublet VB submarines NNS sub-markets NNS submits VBZ submitted VBD submitted VBN submitting VBG submit VB submit VBP subordinated VBD subordinated VBN subordinates NNS subordinates VBZ subordinate VB subpoenaed VBN subpoenas NNS subpoena VB subscribed VBN subscribers NNS Subscribers NNS subscribes VBZ subscribe VB subscribe VBP subscribing VBG Subscribing VBG subscriptions NNS sub-segments NNS subsided VBD subsided VBN subsides NNS subsidiaries NNS subsidies NNS Subsidies NNS subsidized VBN subsidizes VBZ subsidize VB subsidizing VBG Subsidizing VBG subskills NNS substances NNS substantiate VB substations NNS substituted VBD substituted VBN substitutes NNS substitute VB substituting VBG Substituting VBG substracting VBG subsumed VBN subtilis NNS subtitled VBN subtracted VBD subtracted VBN subtracting VBG subtract VB sub-underwriters NNS sub-underwriting VBG suburbs NNS subversives NNS subverted VBN subverts VBZ subvert VB subways NNS succeeded VBD succeeded VBN succeeding VBG Succeeding VBG succeeds VBZ succeed VB succeed VBP successes NNS successors NNS succumbed VBD succumbed VBN succumbing VBG suckers NNS sucks VBZ sued VBD sued VBN SUES VBZ sue VB suffered VBD suffered VBN suffering VBG Suffering VBG suffers VBZ suffer VB suffer VBP sufficed VBD suffice VB Suffice VB suggested VBD suggested VBN suggesting VBG suggestions NNS suggests VBZ suggest VB suggest VBP suing VBG suited VBN suites NNS suitors NNS Suitors NNS suits NNS Suits NNS suits VBZ suit VB summaries NNS summarized VBD summarize VB summarizing VBG Summarizing VBG summed VBD summers NNS summoned VBD summoned VBN summoning VBG summon VB sums NNS sums VBZ sum VB Sundays NNS sunflowers NNS sunglasses NNS sung VBN sunk VBD sunk VBN sunsets NNS superceded VBD supercede VBP supercomputers NNS superconcentrates NNS Superconcentrates NNS superconductors NNS Superconductors NNS superimposed VBN superintendents NNS superiors NNS supermarkets NNS Supermarkets NNS superpowers NNS superpremiums NNS superseded VBD superseded VBN supersede VB superstars NNS supervised VBD supervised VBN supervises VBZ supervise VB supervise VBP supervising VBG supervisors NNS supplements NNS supplement VB supplied VBD supplied VBN suppliers NNS Suppliers NNS supplies NNS supplies VBZ supplying VBG supply VB supply VBP supported VBD supported VBN supporters NNS Supporters NNS supporting VBG Supporting VBG supports NNS supports VBZ support VB support VBP supposed VBD supposed VBN suppose VB Suppose VB suppose VBP suppressants NNS suppressed VBD suppressed VBN suppress VB surfaced VBD surfaced VBN surfaces VBZ surface VB surface VBP surfacing VBG surfers NNS surged VBD SURGED VBD surged VBN surges NNS surges VBZ surge VB surging VBG surmounting VBG surpassed VBD surpassed VBN surpassing VBG surpass VB surpass VBP surpluses NNS surprised VBD surprised VBN surprises NNS Surprises NNS surprise VB surprising VBG surrendered VBD surrendered VBN surrendering VBG surrender VB Surrender VB surrounded VBN Surrounded VBN surrounded VBN|JJ surrounding VBG surround VBP surtaxes NNS surveyed VBD surveyed VBN Surveying VBG surveys NNS Surveys NNS surveys VBZ survey VB survey VBP survived VBD Survived VBD survived VBN survives VBZ survive VB Survive VB survive VBP surviving VBG Surviving VBG survivors NNS suspected VBD suspected VBN suspecting VBG suspects NNS suspects VBZ suspect VB suspect VBP suspended VBD suspended VBN suspending VBG suspend VB suspensions NNS suspicions NNS sustained VBD 
sustained VBN sustaining VBG sustains VBZ sustain VB sutures NNS suvivors NNS 's VBZ s VBZ 'S VBZ swallowed VBN swallowing VBG swallow VB swamped VBD swamped VBN swamp VB swans NNS swapped VBN swapping VBG swaps NNS swap VB swap VBP swarms NNS swathed VBN swayed VBN swaying VBG sway VB sway VBP swears VBZ swear VB swear VBP sweated VBN sweaters NNS Sweating VBG sweatshirts NNS sweat VB sweat VBD sweat VBP Swedes NNS sweepers NNS sweeping VBG sweeps NNS sweepstakes NNS sweeps VBZ sweep VB sweetened VBD sweetened VBN sweeteners NNS sweeten VB sweets NNS swelled VBD swelled VBN swelling VBG swells NNS swells VBZ swell VB swell VBP swept VBD swept VBN swerve VBP swimming VBG swim VBP swindled VBN swine NNS swinging VBG swings NNS swings VBZ swing VB swing VBP switched VBD switched VBN switchers NNS switches NNS switches VBZ switching VBG SWITCHING VBG switch VB switch VBP swiveling VBG Swiveling VBG swore VBD sworn VBN swung VBD SWUNG VBD swung VBN sycophants NNS symbolized VBN symbolizes VBZ symbols NNS sympathies NNS sympathizers NNS sympathize VBP symposiums NNS symptoms NNS Syms NNS synchronized VBN Synchronized VBN synchronize VBP syndciated VBN syndicated VBN syndicates NNS Syndicates NNS syndicate VB syndicating VBG syndications NNS synergies NNS syngeries NNS synonyms NNS synthesizers NNS synthesize VB synthetics NNS systems NNS Systems NNS tabacs NNS tables NNS tablespoons NNS tablets NNS tabloids NNS taboo VB tabs NNS tacked VBD tacking VBG tackled VBN tackles VBZ tackle VB tackle VBP tackling VBG tacos NNS tactics NNS tagged VBN tags NNS tag VB tailing VBG tailored VBN tailoring VBG tails NNS tainted VBN taken VBN Taken VBN takeovers NNS takers NNS takes VBZ Takes VBZ taketh VB take VB Take VB take VBP Take VBP takings NNS taking VBG Taking VBG talents NNS tales NNS Tales NNS talked VBD talked VBN talking VBG Talking VBG talks NNS Talks NNS talks VBZ TALKS VBZ talk VB talk VBP tallied VBD tallies NNS tallying VBG taming VBG Taming VBG tampering VBG tampers NNS tamper VB tampons NNS Tandy VB tangled VBN tangle VBP tangoed VBD tanked VBN tankers NNS Tankers NNS tanks NNS Tanks NNS tank VB tanned VBN tans NNS tantalizing VBG taped VBD taped VBN Taped VBN tapering VBG tapers NNS tapers VBZ taper VB tapes NNS tapestries NNS tape VB tape VBP tapings NNS taping VBG tapped VBD tapped VBN tapping VBG taps NNS Taps VBZ tap VB Tap VB targeted VBD targeted VBN targeting VBG targeting VBG|NN targets NNS targets VBZ target VB target VBP tariffs NNS tarnished VBD tarnished VBN tarnish VB tarred VBD tartans NNS tasks NNS tassels NNS tastes NNS Tastes NNS tastes VBZ taste VB taste VBP taught VBD taught VBN taunted VBD tax-deductions NNS taxed VBD taxed VBN taxes NNS Taxes NNS taxes VBZ tax-exempts NNS Tax-exempts NNS taxpayers NNS Taxpayers NNS TAXPAYERS NNS tax-reducing VBG tax VB tax-writers NNS T-bills NNS teachers NNS teaches VBZ teaching VBG teach VB TEACH VB teach VBP teamed VBD teaming VBG teammates NNS teams NNS Teams NNS team VB tearing VBG tears NNS tear VB teased VBN teaspoons NNS technical-services NNS technicians NNS techniques NNS technocrats NNS technologies NNS teemed VBD teeming VBG teen-agers NNS teenagers NNS teens NNS Teens NNS teetering VBG teeth NNS telecines NNS telecommunications NNS telecommunications NNS|NN Telecussed VBD telegraphed VBD telegraph VBP telemarketers NNS telephoned VBD Telephone-operations NNS telephones NNS telephone VB telephoning VBG telesystems NNS Telesystems NNS televised VBN televisions NNS telexes NNS tellers NNS telling VBG tells VBZ tell VB Tell VB 
tell VBP temblors NNS temperatures NNS tempered VBN temps NNS tempted VBD tempted VBN tempts VBZ tempt VB tempt VBP tenants NNS tended VBD tended VBN tendencies NNS tendered VBD tendered VBN tendering VBG tenders NNS Tenders NNS tender VB tender VBP tending VBG tends VBZ tend VB tend VBP tenets NNS tensions NNS tens NNS tenths NNS termed VBD termed VBN terminals NNS Terminals NNS terminated VBD terminated VBN terminate VB terminating VBG terminations NNS terms NNS Terms NNS term VB terrified VBN terrify VB territories NNS terrorists NNS testaments NNS test-drive VB test-drive VBP tested VBD tested VBN testers NNS test-fired VBN testified VBD testifies VBZ testifying VBG Testifying VBG testify VB testify VBP testing VBG testing VBG|NN tests NNS TESTS NNS tests VBZ test VB test VBP tethered VBN textbooks NNS textiles NNS texts NNS thanked VBD thanking VBG thanks NNS Thanks NNS THANKS NNS thank VB Thank VB thank VBP that VBP theaters NNS thefts NNS Thefts NNS themed VBN themes NNS theologians NNS theories NNS theorists NNS Theorists NNS theorized VBD theory-teaching VBG therapies NNS therapists NNS thermometers NNS The VB the VBP thieves NNS Thieves NNS things NNS Things NNS thinking VBG thinks VBZ think VB Think VB think VBP Think VBP thinned VBN thinning VBG thirds NNS thirties NNS Thirties NNS thistles NNS thoroughbreds NNS thoughts NNS thought VBD thought VBN thousands NNS Thousands NNS thrashed VBD thrashing VBG thrash VB threads NNS threatened VBD threatened VBN threatening VBG threatens VBZ threaten VB threaten VBP threats NNS three-fourths NNS three-quarters NNS three-sevenths NNS threw VBD thrifts NNS Thrifts NNS thrilled VBN thrills VBZ thrill VB thrived VBD thrives VBZ thrive VB thrive VBP Thrive VBP thriving VBG throats NNS throwers NNS throwing VBG Throwing VBG thrown VBN throws VBZ throw VB Throw VB throw VBP thrusting VBG thrusts NNS thrust VBD thrust VBN thugs NNS thumbing VBG thumbs NNS thumbs VBZ thumb VB thundered VBD thwarted VBD thwarted VBN thwarting VBG thwart VB ticked VBN ticketed VBN ticketing VBG tickets NNS ticking VBG ticks VBZ tick VB tidbits NNS tides NNS tied VBD tied VBN tie-ins NNS ties NNS ties VBZ tie-ups NNS tie VB tigers NNS tightened VBD tightened VBN tightening VBG tighten VB tighten VBP tiles NNS tilted VBN tilts VBZ tilt VB timberlands NNS timbers NNS timed VBD timed VBN time-hotels NNS time-shares NNS times NNS Times NNS time VB timing VBG timpani NNS tinged VBN tinges NNS tinkered VBN tinkering VBG tinker VB tins NNS tipped VBD tips NNS tipsters NNS tiptoed VBD tiptoed VBN tiptoe VB tip VB tired VBN tire-kickers NNS tires NNS tires VBZ tissues NNS titans NNS titled VBD titled VBN Titled VBN titles NNS toasted VBD toddlers NNS toeholds NNS toes NNS toiled VBD toiletries NNS toiling VBG toil VB toil VBP told VBD told VBN tolerate VB tolls NNS Tolls NNS tomatoes NNS toned VBN tones NNS tongues NNS tonnages NNS tons NNS Tons NNS took VBD tools NNS tooted VBD topics NNS topped VBD topped VBN topping VBG Topping VBG toppled VBD toppled VBN topple VB tops NNS tops VBZ top VB top VBP torched VBD torched VBN tore VBD Tories NNS tormentors NNS torments VBZ torment VB tornadoes NNS torn VBN torpedoed VBN torpedo VB torts NNS tortured VBN torture VB torture VBP tossed VBD tossed VBN tossers NNS tossing VBG toss VB totaled VBD totaled VBN totaling VBG totalling VBG totals NNS Totals NNS totals VBZ total VB total VBP toted VBN tote VB toting VBG tottering VBG totter VB touched VBD touched VBN touches NNS Touches VBZ touching VBG touch VB touch VBP toughened VBD 
toughen VB tough VB toured VBD touring VBG tourists NNS tournaments NNS tours NNS tours VBZ tour VB touted VBD touted VBN touting VBG touts VBZ tout VB towels NNS Towering VBG towers NNS tower VB townhouses NNS townships NNS towns NNS tows NNS toying VBG toys NNS traced VBD traced VBN traces NNS traces VBZ trace VB tracing VBG tracked VBD tracked VBN tracking VBG tracks NNS tracks VBZ track VB track VBP tractors NNS tracts NNS traded VBD traded VBN traded VBN|VBD trademarks NNS trade-offs NNS tradeoffs NNS traders NNS Traders NNS trades NNS trades VBZ trade VB trade VBP trading VBG Trading VBG trading VBG|NN traditionalists NNS traditions NNS traduced VBN traduce VB traffickers NNS tragedies NNS trailed VBD trailed VBN trailers NNS trailing VBG trails NNS trails VBZ trail VB trail VBP trained VBN Trained VBN trainers NNS training VBG trains NNS Trains NNS trains VBZ train VB train VBP traipse VB traits NNS tramping VBG trampled VBN trampling VBG transacted VBN transacting VBG transactions NNS Transactions NNS transact VB transcribe VBP transcripts NNS transferred VBD transferred VBN transferring VBG transfers NNS transfers VBZ transfer VB transformed VBD transformed VBN transforming VBG transforms VBZ transform VB transfusions NNS transistors NNS translated VBN Translated VBN translate VB translate VBP translating VBG translations NNS transmissions NNS transmitted VBD transmitted VBN transmitting VBG transmit VB transmogrified VBD transmogrified VBN transplanted VBN transplanting VBG transplants NNS transplant VB transported VBD transported VBN transporting VBG transports NNS Transports NNS transports VBZ transport VB Transport VB transvestites NNS trapped VBN trappings NNS trapping VBG traps NNS trashing VBG trash VB traumas NNS traumatized VBD traumatized VBN travails NNS traveled VBD traveled VBN travelers NNS Travelers NNS traveling VBG Traveling VBG travelogues NNS travels NNS travels VBZ TRAVELS VBZ travel VB travel VBP trays NNS treadmills NNS treads VBZ tread VB treasurers NNS treasures NNS Treasures NNS treasuries NNS Treasurys NNS treated VBD treated VBN treating VBG TREATING VBG treatises NNS treatments NNS treats NNS treats VBZ treat VB treat VBP trebled VBD trees NNS trekked VBD trembling VBG tremors NNS trenches NNS trending VBG trend-setters NNS trends NNS trend VB trespasses NNS trespass VBP trials NNS triangles NNS tribes NNS tributes NNS trickle VB trickle VBP trickling VBG tricks NNS trick VB tried VBD tried VBN tries NNS tries VBZ triggered VBD triggered VBN triggering VBG Triggering VBG triggers VBZ trigger VB trigger VBP trillions NNS trills NNS trimesters NNS trimmed VBD trimmed VBN trimming VBG TRIMMING VBG trim VB Trim VBP tripled VBD tripled VBN triples NNS triple VB tripling VBG tripped VBN trips NNS triumphed VBD trivialize VB trivia NNS troops NNS Troops NNS TROs NNS trotted VBD trotted VBN Trotting VBG troubled VBD troubled VBN Troubled VBN troublemakers NNS troubles NNS TROUBLES NNS troubles VBZ troubling VBG troughed VBD troughs NNS troupes NNS trousers NNS trout NNS Truckers NNS truck-parts NNS trucks NNS trucks VBZ truck VBP trudging VBG Trumped VBN trumpeting VBG trumpets VBZ trumpet VBP trundles VBZ trunks NNS trusted VBD trusted VBN trustees NNS Trustees NNS trusting VBG trusts NNS TRUSTS NNS trusts VBZ trust VB trust VBP truths NNS trying VBG Trying VBG tryouts NNS try VB Try VB try VBP Try VBP T-shirt NNS T-shirts NNS tubes NNS tubs NNS tucked VBD tucked VBN tucking VBG tuck VB tugged VBD tugging VBG tuitions NNS Tuitions NNS tumbled VBD tumbled VBN 
tumbles NNS tumbles VBZ tumble VB tumbling VBG tumors NNS tumor-suppressors NNS tuned VBN tunes NNS tune VB tune VBP tuning VBG tunnels NNS turbans NNS turbines NNS turboprops NNS turmoils NNS turnarounds NNS turned VBD turned VBN Turned VBN turning VBG turn-ons NNS turns NNS turns VBZ Turns VBZ TURNS VBZ turn VB turn VBP turtles NNS tusks NNS tutored VBN tutorials NNS tutoring VBG tuxedos NNS TVs NNS tweezers NNS twenties NNS twiddling VBG twinned VBN twisted VBN twisting VBG twists NNS twists VBZ twist VBP twitch VB two-hundredths NNS two-sevenths NNS two-thirds NNS twothirds NNS Two-thirds NNS tycoons NNS tying VBG typed VBN typefaces NNS types NNS typewriters NNS typhoons NNS typified VBD typifies VBZ UFOs NNS ulcers NNS ultimatums NNS umbrellas NNS un-advertisers NNS unbanning VBG unblock VB uncertainties NNS unchlorinated VBN uncles NNS unconsolidated VBD unconsolidated VBN uncovered VBD uncovered VBN uncovering VBG uncover VB Underclass NNS undercutting VBG undercut VB undercut VBD undercut VBN undercut VBP underestimated VBD underestimated VBN underfunded VBN undergirded VBD undergoing VBG undergone VBN undergo VB undergo VBP underlie VB underlined VBD underline VB underlying VBG Underlying VBG undermined VBD undermined VBN undermine VB undermine VBP undermining VBG underperformed VBN underperformers NNS underperforming VBG underperforms VBZ underperform VB underpinned VBN underpinning VBG underpin VB underpriced VBN underreacting VBG underscored VBD underscored VBN underscores VBZ underscore VB underscore VBP underscoring VBG Underscoring VBG underselling VBG understaffs VBZ understand\/adopt VB understanding VBG understands VBZ understand VB understand VBP understated VBD understated VBN understate VBP understating VBG understood VBD understood VBN undertaken VBN undertake VB undertakings NNS undertaking VBG undertones NNS undertook VBD underutilized VBN undervalued VBD undervalued VBN underweighted VBN underwent VBD underwhelmed VBN underwiters NNS underwriters NNS Underwriters NNS underwrites VBZ underwrite VB underwrite VBP underwritings NNS underwriting VBG Underwriting VBG underwritten VBN underwrote VBD undid VBD undone VBN undo VB undulate VB undulate VBP unearthed VBD unexecuted VBN unfazed VBN unfocussed VBN unfolded VBD unfolding VBG unfolds VBZ unfold VB unhinged VBN unhocked VBN unhusked VBN unified VBN uniforms NNS unifying VBG unify VB Unify VB unionists NNS unionized VBD unions NNS Unions NNS united VBN United VBN unites VBZ unite VB unitholders NNS Unitholders NNS units NNS Units NNS universities NNS Universities NNS unknowns NNS unleashed VBD unleashed VBN unleashes VBZ unleashing VBG unleash VB unleash VBP unloaded VBN unloading VBG Unloading VBG unload VB unload VBP unlocked VBD unlocks VBZ unlock VBP unmasks VBZ unmask VB unmaterialized VBN unnerved VBD unnerving VBG unplug VB unpolarizing VBG unraveled VBD unraveled VBN unraveling VBG unravel VB unrolls VBZ unroll VBP unseated VBD unseating VBG unsettled VBD unsettled VBN unveiled VBD unveiled VBN Unveiled VBN unveiling VBG unveils VBZ unveil VB unwavering VBG unwinding VBG unwind VB updated VBN updates NNS update VB updating VBG upgraded VBD upgraded VBN upgrades NNS Upgrades NNS upgrade VB upgrading VBG upheavals NNS upheld VBD upheld VBN UPHELD VBN upholding VBG upholds VBZ uphold VB upped VBD Upping VBG uprooted VBD ups-and-downs NNS upsets NNS upsetting VBG upset VB upset VBD upset VBN Upset VBN ups NNS uptick VB Urals NNS urged VBD urged VBN URGED VBN urges VBZ urge VB urge VBP urgings NNS urging VBG 
used VBD used VBN Used VBN users NNS Users NNS uses NNS uses VBZ use VB Use VB use VBP ushered VBD ushered VBN ushering VBG ushers NNS ushers VBZ using VBG Using VBG usurp VB U.S. VBP utilities NNS Utilities NNS utilize VB utmosts NNS utopians NNS utterances NNS uttered VBD uttering VBG UVB NN vacancies NNS Vacancies NNS vacated VBD vacated VBN vacate VB vacating VBG vacationers NNS vacationing VBG vacations NNS vaccines NNS vacillate VB vacuum VB vagabonds NNS vagaries NNS validating VBG valuations NNS valued VBD valued VBN Valued VBN values NNS values VBZ value VB value VBP valuing VBG valves NNS vandalized VBD vanished VBD vanished VBN vanishes VBZ vanishing VBG vanish VB vanish VBP Vanities NNS vans NNS vapors NNS variables NNS variations NNS varied VBD varied VBN varies VBZ varieties NNS varying VBG vary VB vary VBP Vary VBP vases NNS vassals NNS vaults NNS vault VB VCRs NNS veering VBG veer VB vegetables NNS Vegetables NNS vegetarians NNS vehicles NNS veiled VBN Veiling VBG vending VBG vendors NNS vented VBD ventilated VBD ventilated VBN ventures NNS venture VB venturing VBG vent VB venues NNS verdicts NNS verged VBD verified VBN verify VB versions NNS vessels NNS vested VBN vestments NNS vests NNS veterans NNS veterinarians NNS vetoed VBD vetoed VBN vetoes NNS vetoing VBG veto VB 've VB 've VBP vexed VBN viaducts NNS vibrating VBG vicars NNS vices NNS vicissitudes NNS vicitims NNS victimized VBN victims NNS VICTIMS NNS victories NNS VICTORIES NNS videocassettes NNS videodisks NNS videos NNS videotapes NNS videotape VB Vietnamese NNS viewed VBD viewed VBN viewers NNS Viewers NNS viewings NNS viewing VBG viewpoints NNS views NNS Views NNS views VBZ view VB view VBP vignettes NNS villagers NNS villages NNS Villages NNS villains NNS vindicated VBN vineyards NNS vintages NNS vinyl-products NNS violated VBD violated VBN violates VBZ violate VB violate VBP violating VBG violations NNS virgins NNS virtues NNS virtuosos NNS visages NNS visionaries NNS visions NNS visited VBD visited VBN visiting VBG Visiting VBG visitors NNS Visitors NNS visits NNS visits VBZ visit VB visit VBP visualize VB VISUALIZING VBG visuals NNS vitiate VB voiced VBD voiced VBN voices NNS Voices NNS voices VBZ voice VB voice VBP voicing VBG voided VBN void VB volumes NNS volunteered VBD volunteered VBN volunteers NNS volunteer VB vomiting VBG voted VBD voted VBN vote-getters NNS voters NNS Voters NNS votes NNS votes VBZ vote VB vote VBP voting VBG vouchers NNS vowed VBD vowed VBN vowels NNS Vowels NNS vowing VBG Vowing VBG vows VBZ vying VBG waddles VBZ wade VB wad VB wafers NNS waffled VBD waffled VBN wafting VBG waged VBD wages NNS wage VB waging VBG wagons NNS wags NNS wailing VBG wail VB waited VBD waited VBN waiters NNS waiting VBG waits VBZ wait VB Wait VB wait VBP waived VBD waived VBN waivered VBN waivers NNS waives VBZ waive VB waiving VBG wake VBP waking VBG walked VBD walkie-talkies NNS walking VBG Walking VBG walking VBG|NN walkouts NNS walks NNS walks VBZ walk VB Walk VB walk VBP Walk VBP wallcoverings NNS wallets NNS wallops VBZ wallowing VBG walls NNS wall VB wandering VBG wanders VBZ wander VB wander VBP waned VBD waned VBN wanes VBZ WANES VBZ wane VB wane VBP waning VBG wanted VBD wanted VBN Wanted VBN wanting VBG wants VBZ want VB want VBP warded VBN wardens NNS ward VB warehouses NNS wares NNS warheads NNS warmed VBD warmed VBN warming VBG warming VBG|NN warm VB warned VBD Warned VBD WARNED VBD warned VBN Warners NNS warnings NNS warning VBG warns VBZ warn VB warn VBP warranted VBN warranties NNS 
warrants NNS warrants VBZ warrant VB warrant VBP Warrens NNS warring VBG warriors NNS wars NNS Wars NNS WARS NNS warts NNS war VB washed VBD washed VBN washing VBG wash VB wash VBP wasted VBD wasted VBN wastes NNS wastes VBZ waste VB wasting VBG was VBD Was VBD WAS VBD watchdogs NNS watched VBD watched VBN watchers NNS watches NNS watches VBZ watching VBG Watching VBG watch VB WATCH VB watch VBP watered VBD waterfalls NNS watering VBG waters NNS water VB waterworks NN|NNS watts NNS waved VBD wavelengths NNS wavered VBD wavering VBG waves NNS waving VBG waxed VBD waxed VBN ways NNS Ways NNS weakened VBD weakened VBN weakening VBG Weakening VBG weakens VBZ Weakens VBZ weaken VB weaken VBP weaknesses NNS wean VB weapons NNS wearing VBG Wearing VBG wears VBZ wear VB Wear VB wear VBP weasling VBG weather VB weather VBP weaves VBZ weaving VBG webs NNS wedded VBN weddings NNS wedged VBD wedged VBN wedge VB Wednesdays NNS weds VBZ wed VBN Weeds NNS weekdays NNS weekends NNS weeklies NNS weeknights NNS weeks NNS weepers NNS weeping VBG weighed VBD weighed VBN weighing VBG Weighing VBG weighs VBZ weighted VBN weightings NNS weights NNS weight VB weigh VB weigh VBP welcomed VBD welcomed VBN welcomes VBZ welcome VB Welcome VB welcome VBP welcoming VBG welded VBN wells NNS well-stated VBN well-wishers NNS went VBD WENT VBD wept VBD were VB Were VB were VBD Were VBD we VBP whacked VBD whacked VBN whack VB whales NNS wheelbases NNS wheeled VBN wheels NNS wheezing VBG when-issued VBN while VB whimpers NNS whims NNS whipped VBN whippings NNS whipping VBG whipsawed VBN whipsaw VB whips VBZ whip VB whirlwinds NNS whirring VBG whisked VBN whispered VBN whispering VBG whispers NNS whistled VBN whistles NNS whistle VBP whistling VBG whites NNS whitewashed VBN whittled VBN whizzes NNS wholesalers NNS Wholesalers NNS wholesaling VBG whooping VBG whoosh VBP widened VBD Widened VBD widened VBN widening VBG widens VBZ widen VB widen VBP widgets NNS widowed VBN widows NNS wielded VBN wielding VBG wields VBZ wield VB wiggled VBD wiggle VBP wiggling VBG wigs NNS Wilfred VBD willies NNS willing VBG wills NNS will VB wimping VBG wimp VB windfalls NNS winding VBG windows NNS windshields NNS winds NNS wind VB wind VBP wineries NNS wines NNS wings NNS winking VBG winners NNS Winners NNS winning VBG Winning VBG wins NNS wins VBZ winters NNS win VB win VBP wiped VBD wiped VBN wipe VB wipe VBP wiping VBG wired VBN wires NNS wiretaps NNS wire VB wisecracks NNS wished VBD wished VBN wishes NNS Wishes NNS wishes VBZ wishing VBG wish-lists NNS wish VB wish VBP witches NNS withdrawals NNS withdrawing VBG withdrawn VBN withdraw VB withdrew VBD withering VBG wither VBP withheld VBD withheld VBN withholdings NNS withholding VBG withhold VB Withhold VB withhold VBP withstanding VBG withstand VB withstood VBD withstood VBN witnessed VBN witnesses NNS Witnesses NNS witnessing VBG Witness VB wives NNS Wives NNS wizards NNS woes NNS woken VBN woke VBD wolves NNS womanizing VBG women NNS Women NNS wonderbars NNS wondered VBD wondering VBG wonders NNS wonders VBZ wonder VB wonder VBP won NNS won VBD won VBN WON VBP woodchucks NNS wood-products NNS woods NNS wooed VBN wooing VBG woo VB worded VBN word-processing NNS words NNS wore VBD workbooks NNS workdays NNS worked VBD worked VBN workers NNS Workers NNS WORKERS NNS workings NNS working VBG Working VBG working VBG|NN workmen NNS worksheets NNS Worksheets NNS works NNS workstations NNS works VBZ work VB Work VB work VBP WORK VBP world-affairs NNS worlds NNS worms NNS worn VBN Worn VBN 
worried VBD worried VBN Worried VBN worriers NNS worries NNS Worries NNS worries VBZ worrying VBG worry VB worry VBP worsened VBD worsened VBN worsening VBG worsen VB wounded VBN wounds NNS wound VB wound VBD wound VBN woven VBN wows VBZ wracked VBD wracked VBN wrack VBP wrangling VBG wrapped VBD wrapped VBN wrappers NNS wrapping VBG wraps VBZ wrap VB wreaked VBD wreaking VBG wreak VB wrecked VBD wrecking VBG wreck VB wrenched VBN wrenching VBG wrested VBN wrestlers NNS wrestles VBZ wrestle VB wrestling VBG wrest VB wriggling VBG wring VB wrists NNS write-downs NNS writedowns NNS write-offs NNS writeoffs NNS writer\/producers NNS writers NNS writes VBZ Writes VBZ write VB write VBP writhing VBG writings NNS writing VBG Writing VBG written VBN Written VBN wronged VBN wrote VBD Wrote VBD wrought VBD wrung VB X-rays NNS yachts NNS yanked VBD yanked VBN yanking VBG yank VB yards NNS yearbooks NNS yearlings NNS years NNS Years NNS YEARS NNS yelled VBD yelling VBG yellows NNS yells VBZ yell VB yelped VBD yen NNS yielded VBD yielded VBN yielding VBG yields NNS Yields NNS yields VBZ yield VB yield VBP youngsters NNS Younkers NNS youths NNS yuppies NNS zappers NNS zapping VBG zeroing VBG zeros NNS zero VB zero VBP zigzags NNS zig-zag VBP zip VB zip VBP zlotys NNS zombies NNS zones NNS Zones NNS zoning VBG zoomed VBD zoomed VBN zoom VB ================================================ FILE: ccgbank/data/wsj-nns-vb-stems ================================================ 12-inch 15 16-year-old 1850 1890 18-year-old 1900 1920 1930 1940 1950 1960 1970 1980 1990 19-year-old 204 20 20-stock 3090 '30 30 323 '40 '50 '60 '70 747-400 757-200 75-cents-an-hour '80 80 8300 '90 a330-300 abacus abandon abandon abandon abandon abandon abandon abandon abate abate abate abate abate abdicate abet abet abide ability abolish abolish abolish abolish abort abortion-rights abortion-rights abortion abound abound abound abound abrasive abridge absence absent absent absolve absolve absorb absorb absorb absorber absorb absorb absorb absorb abstain abstention abstract abuse abuse abuse abuse abuse academic accede accede accelerate accelerate accelerate accelerate accelerate accelerate accent acceptance acceptance accept accept accept accept accept accept accessory accessory access accident acclaim accolade accommodate accommodate accommodate accommodate accommodation accomodate accompany accompany accompany accompany accompany accomplish accomplish accomplish accomplishment accomplish accord accord accord accord accord accord accountant account account account account account account account account accrete accrual accrue accrue accrue accrue accrue accumulate accumulate accumulate accusation accuse accuse accuser accuse accuse accuse accuse accustom ace achieve achieve achievement achieve achieve achieve achieve ache acidify acid acknowledge acknowledge acknowledge acknowledge acknowledge acknowledge acorn acquaint acquiesce acquiesce acquire acquire acquire acquirer acquirer acquire acquire acquire acquisition acquisition acquit acquit acre across-the-board-cut act act act act action activate activate active activist activist activity actor act act actuary act act adapt adapt adapt adapt adapt adapt add add add add addict addict add add addition additive address address address address address address address address add add add add add adept adhere adhere adhesive adjourn adjudicator adjust adjust adjuster adjuster adjust adjustment adjust adjust adjust adjust adman administer administer administer administration administrator 
admire admire admirer admire admission admit admit admit admit admit admit admit admit admonish adolescent adopt adopt adopt adopt adopt adopt adopt adopt adorn adorn adorn adr ad ad ad adult adult advanced-ceramic advance advance advancement advancer advancer advance advance advance advance advance advance advantage advantage adventure adversary advertise advertise advertisement advertiser advertiser advertise advertise advertise advertise advertise advertise advise advise adviser advise advise advise advise advise advisory advocate advocate advocate advocate advocate advocate advocate advocate aerobic affair affected affect affect affect affection affect affect affect affidavit affiliate affiliate affiliate affiliate affinity affirm affirm afflict afflict afflict afford afford afford aftereffect aftereffect after-hour afternoon aftershock aftershock aftershock age agency agenda agent agent age age aggravate aggravate aggravate aggravate aggravate aggravate aggregate age agitate agonize agree agree agree agree agreement agree agree agree agree agriproduct aichus aid aid aid aide aide aid aid aid aid ail ailment ail aim aim aim aim aim aim aim aim aim aim aircraft air air airfield air airlift airlift airliner airline airline airman airplane airport air air air air airwave aisle be be alarm alarm alarm alarm alarm albanian album alchemist alcoholic alert alert alert alert alienate alienate alienate alienate alien align align allay allay allegation allege allege allege allege allege allege allege allergy alleviate alleviate alley alliance ally ally ally alligator allocate allocate allocate allocate allocate allocation allotment allowance allow allow allow allow allow allow allow allow allow alloy allrightnik allude allusion ally ally alter alter alter alternate alternate alternate alternative alter alter alter aluminum-maker alumnus amah amalgamate amalgamation amass amass amass amass amass amateur amaze amaze ambassador ambiguity ambition amble ambush amend amend amend amend amendment amend amenity amenity a-man americana americanize american american amortize amount amount amount amount amount amount amount amphobile amplify amplifier amplify amplify amp amuse amusement amuse be be be anachronism analysis analysis analyst analyst analyze analyze analyze analyze analyze anchor anchor anchor anchor and anemia anemic angel anger anger anger angle animal animal animate animosity ankle anne anniversary announce announce announce announcement announce announce announce announce annoy annoy annualize annualize annuity annuity annuity anoint anomaly answer answer answer answer answer answer answer answer antagonist antagonize anteater antecedent antelope anther anti-abortionist antibody anticipate anticipate anticipate anticipate anticipate anticipate anticipate antic anti-hero anti-infective antipathy anti-programmer antiquity ant anxiety apartment apology apologist apologize apologize apologize apologize appal apparition appeal appeal appeal appeal appeal appeal appeal appearance appear appear appear appear appear appear appear appear appease appease appendage append append applaud applaud applaud applaud applaud apple appliance applicant application application apply apply apply apply apply apply apply apply appoint appoint appoint appointee appointment appoint appraisal appraise appraiser appraise appreciate appreciate appreciate appreciate appreciate appreciate apprehension apprise approach approach approach approach approach approach approach appropriate appropriate appropriation 
appropriation appropriator approval approve approve approve approve approve approve approve approximate arab arbitrager arbitrager arbitrageur arbitrage arbitrage arbitrate arbitrate arborist arb arb arcade arch architect architect arch area area arena be be be argue argue argue argue argue argue argue argument arise arise arise arise arise arise arkansa armadillo arm arm army armpit arm arm arm aroma arise arouse arouse arouse arouse arouse arpeggio arraignment arrange arrange arrangement arrangement arrange arrange arrange arrears arrest arrest arrest arrest arrest arrival arrive arrive arrive arrive arrive arrive arrive arrow arsenal artery article articulate artifact artillerist artist artist art art artwork asahus ascend ascertain ascribe ascribe ash ashland ashtray ask ask ask ask ask ask ask ask ask aspect aspen aspersion aspiration aspire aspire aspire aspire assail assail assassinate assassinate assassinate assassinate assassination assault assault assemblage assemble assemble assemble assemble assembly assemble assert assert assert assertion assert assert assert ass assess assess assess assessment assess assess asset asset asset assign assignment assign assign assign assimilate assistant assist assist assist assist assist associate associate associate associate associate association assuage assume assume assume assume assume assume assume assume assumption assurance assure assure assure assure assure asteroid astound astronaut eat eat athlete athletics atlanti atoll atom atone atrocity attach attach attach attach attach attach attack attack attacker attack attack attack attack attack attack attain attain attarck attempt attempt attempt attempt attempt attempt attempt attempt attendant attendant attend attend attendee attend attend attend attend attention attest attest attic attitude attitude attorney attorney attract attract attract attract attraction attract attract attract attribute attribute attribute attribute attribute attribute attribute auction auction auction auction auction audience audiocassette audiophile audit audit audit audition auditor auditor audit audit audit augment auspices author authority authority authorization authorize authorize authorize authorize authorize author aution auto-emission autograph autograph autograph auto\/homeowners automaker automate automate automate automate automobile automobile auto-sale auto autumn avenge avenue average average average average average average average aver avert avert avert avert aviator avoid avoid avoid avoid avoid avoid avoid avoid await await await await await awaken award award award award award award awake axiom axle b-2 babelist baby baby backdate back-date back back back backer backfire backfire backfire backfire backfire backflip background back backlog backlot backpacker backpack backpedal backslap back back back back-up back back bacterium badge bag bail bailiff bail bailout bail bakery baker balance balance-of-payment balance balance balance balance balance balcony bale balk balk balk balk balk ballerina ballet balloon balloon balloon balloonist balloon balloon balloon ballot ballot ballpark ballplayer ball ballyhoo bamboozle banana bandage band bandy band band bang bang banish banish banker banker banker bank bankroll bankroll bankroll bankruptcy bankrupt bankrupt bank bank bank bank bank ban ban banner ban banshee ban ban ban ban barb barber barb bargain bargain bargain-hunter bargain-hunt bargain bargain bargain barge barge bare bark barnacle barn baron bar bar bar barrel barrel barrel barricade barrier 
bar bar bar bar bartender barter bar bar baseball base base base basement basis base base base bash bash bash basics base basket basket bastion batch bath bathroom bath bat battalion bat bat batter batter battery batter batter bat battle battle battle battlegroup battlements battle battle battle battle battle bay beach bead beam beam beam beanball bean bearing bear bear bear bear bear bear beastie beast beat beat beat beat beat beat beat become become become become become become become become become bedevil bedevil bedfellow bedfellow bedpan bedroom bed beef beef beef beef be be be beep beep beer bee befall befall befall befriend befuddle begin beggar beg beg beginning begin begin begin begin begin begin beget beg begin beg behave behave behave behave behave behavior behead behemoth being be be be be beleaguer belfry belie belief belie belie believe believe believe believe believe believe belittle belly bellow bellringer bell bellwether belly-flop belong belongings belong belong belong belong belt belt bemoan bench benchmark bend bend benefactor beneficiary beneficiary benefit benefit benefit benefit benefit benefit benefit benefit benefit bequeath bequest berate berry beset besiege best best bestir bestow beta betray bet bet betters better bet bet bet bet bet be be be be beverage beware beware beware bewilder bewilder bewitch bias bias bible bicker bicker bicycle bidder bid bid bid bid bid bid bid bid bifurcate biker biker bike bike bilge bilk bill bill billing billing bill billion billion billow bill bill bill bill bill bill binder bind binge binoculars bin bioengineer biographer biologist biomedical-product biopsy bird bird birthday birth biscuit bishop bite bite bite bite bit bite bite blab black blacken blacklist blackmail blackmailer blackmail blackmail blackout black black blackstone blade blame blame blame blame blame blame blame blame blanding blanket blanket blanket blare blast blast blast blast blaze blaze bleacher bleed bleed bleed blemish blend blend blend bless blessing bless blow blindfold blind blini blink blinkers blink blink blip blip blip blitz block block block block block block block block blonde bloody bloodlet blood bloom blossom blossom blossom blot blow blow blow blow bludgeon bludgeon blueblood blue-chip blues blues blunder blunder blunder blunt blunt blunt blur blur blurt blurt blur bmw board boardroom boardroom board board boast boast boast boast boast boater boat boat bodega bode bode body bodyworker boe bog bog bog boil boiler boil boil boil bolster bolster bolster bolster bolster bolster bolster bolt bolt bombard bombard bombard bomb bomb bomber bombing bomblet bomb bomb bond bond-holder bondholder bondholding bond bond bond bone bone bonnet bonus bonus boo book book booker booking booking book booklet book book bookstore book boom boom boomer boom boom boom boost boost booster boost boost boost boost boost boost boost booth booth bootleg boot booze border border border bore bear bore bear bear bear borrow borrow borrow borrower borrower borrowing borrow borrow borrow borrow borrow boss boss botch bother bother bother bother bother bottle bottleneck bottler bottle bottle bottle bottom bottom bottom bottom bottom buy buy bounce bounce bounce bounce bounce bounce boundary bound bound bound bind bourbon bourse boutique bout bouygue bow bow bow bowl bowl bowl bow bow box boycott boycott boyfriend boy boy brace brace brace brace brag brag braid brain brake brake brake branch branch branch branch branch brandish brandish brand brand brand brassiere brat brave brave 
brave brawl brazen brazilian breach breach breach breach bread breakdown breaker break break break break breakthrough break break breast breathe breathe breathe breath breed breed breeder breeder breed breed breed breeze brethren brew brewery brewery brewer brew brew bribe bribe bribe bribe bribe brick bridge bridge bridge briefcase brief brief briefing briefs briefs brief brigade brighten brighten brighten brim bring bring bring bring bristle bristle bristle british broadcaster broadcaster broadcast broadcast broadcast broadcast broadcast broadcast broadcast broadcast broaden broaden broaden broaden broaden brochure break brokerage broker-dealer broker broker broker broker break bronco bronc brother bring bring browbeat browse browse bruise bruise bruise brushback brush brush brush brush brush brussels bubble bubble buccaneer buck buck bucket buck buck buckle buckle buckle buck buck buck buck buddy bud budge budge budget budgeteer budget budge bud buffer buffet buffet buffet buffet buff buff bug bug bug builder builder building-material building-product building building build build build build build build build build build bulb bulge bulkhead bulldoze bulldozer bulletin bullet bullhorn bully bully bull bull bully bumble bumble bumble bump bump bump bump bum bunch bundle bundle bundle bungle bun buoy buoy buoy buoy buoy buoy burble burden burden burden burden burden bureaucracy bureaucrat bureaucrat bureau burgeon burger burglary burglarize burg burial bury bury bury burn burn burn burn burnish burnout burn burn burn burn burn burst burst burst burst burst bury bury bury bus bushel bush busy business-communication business business business-machine businessman businessman business-partner busload bust bust bust bust butler butterfly button buttress buttress buttress butt buy-back buy-back buyer buyer buyer buying buy buy buy-out buyout buy buy buy buy buy buy buzz buzz buzz buzzword bylaw byline bypass bystander cabin-crew cabinet cable cab cache cadet cadge cafe cafeteria cake calamity calavera calculate calculate calculate calculate calculate calculate calculate calculate calculation calculator calibrate californian call call call call call call caller caller call call call call call call call call call calm calm calm calorie caltran calf camera come camouflage campaign campaign campaign campaign camp camper camp campus campus canal cancel cancel cancel cancel cancellation cancel cancel cancer cancer-suppressor candidate candy candle can can can canvas canvass canyon capability capacity capacitor capital-asset capital-drain capital-gain capitalgain capital-goods capitalist capitalize capitalize capitalize capitalize capitalize capital capital-to-asset capita capitulate cap cap cap cap capsule captain caption captivate captive capture capture capture capture capture cap cap carat carbide-product car-dealer cardholder cardinal card care care careen careen careen career career care care care caricature caricature carillon care carnivore carpenter carpetbagger carpet carpet carp carry carry carry carrier carrier carry carry-forward carryforward carry carry carry carry car car cart cart carton cartoonist cartoon cartridge cart cart carve carve carver carve carve carve carve cascade cascade caseload case case case cash cash cash cash casing casino casino casket cassette castigate castigate castigate casting cast castle cast cast cast cast cast casualty cataclysm catalog catalog catapult catapult cataract catastrophe catcher catch catch catch catch catch category categorize cater cater cater 
cater cater catfish catheter cathode cat cattle cattle catch catch cause cause cause cause cause cause cause caution caution caution caution caution caveat cave cave c.d.s cd cease cease cease cease cease cede cede cede cede ceiling celebrate celebrate celebrate celebrate celebrate celebration celebrity cellar cellist cell celluloid cement cement cement-maker cement censor censor censure centenarian center center center center center center center centimeter centralize centralize cent cent century centurion ceo ceramic cereal ceremony certificate certificate certificate certify certify cfc chafe chafe chain chain chain chair chair chairman chair chair chalk chalk challenge challenge challenger challenge challenge challenge challenge challenge challenge chamber chamber champagne champion champion champion championship champion champion champ chance chance chandelier change change change change change change change change change change change change channel channel channel channel chan chant chant chant chant chap chapter characteristic characterize characterize characterize characterize characterize characterize character character charge charge charge-off charge charge charge charge charge charge charge charity charity charlatan charlestonian char charter charter chart chart chart chart chase chaser chase chase chassis chasten chasten chastise chastise chastise chat chat chauffeur chauffeur cheapen cheat cheater cheat cheat cheat checkbook check check check checkpoint check check check check check cheer cheer cheer cheerleader cheer cheer cheese chef chelicerate chemical chemical chemical-weapon chemist cherish cherish cherry cherub chew chew chew chew chew chicken chicken chide chide chide chief child child child chill chill chill chime chimney chimpanzee chinese chip chip chip chisel chlorofluorocarbon choice choice choke choke choke choke choose choose choose choose choose chop chop chop chopstick chop chord choreographer chore chore chortle chorus choose choose christian chromosome chronicle chronicle chuck chuckle chuckle chuckle chug chum chunk church church-goer churn churn cial cigarette cigar cinch cincinnatus circle circle circle circuit circular circulate circulate circulate circulate circulate circulation circumstance circumvent circumvent circumvent citation cite cite Cite cite cite cite citicorp city city cite Cite citizen citizen citizen civic civilian civil-rights clothe clothe claimant claimant claim claim claim claim claim claim claim claim claim claim clamber clamor clampdown clamp clamp clamp clang clank clarification clarify clarify clarify clarify clash clash clash clash class class class classic classic classification classify classify classify classify classmate classroom clause claw clean clean cleaner clean-fuel clean clean cleanse cleanse cleanser cleanse cleanse clean clean clearance clear clear clear clear clear clear clear clergy cleric clerk click clientele client client climb climb climber climb climb climb clinch clinch cling cling clinical-product clinic clinker clip clip clipping clip clip clique cloak clobber clobber clobber clock clock clock clog clog clone clone close close close close close close close close close close closing close close closure clothe clothes clothier cloud cloud cloud cloud cloud clown club club club club club clue clump cluster cluster clutch clutch clutter clutter c'mon coach coach co-anchor coast coaster coast coat coating coat coat coattail co-author co-author coax coax cobble cobble cobb co-chairman cockatoo cockroach 
cocktail coconut coddle code co-defendant code-name code code co-developer codify codify co-edit coerce co-exist coextrude coffer co-found co-founder cognoscenti cohere cohort co-host coincide coincide coincide coin coin cola cold-cut coli collaborate collaborate collaborate collaborate collaborator collage collapse collapse collapse collapse collapse collapse collar collateralize colleague colleague collect collect collectible collectible collect collection collective collectivizer collector collector collect collect collect college college college-sport colloquy colonialist colony colonist color-code color-code color color color columnist column co-manage co-manage combatant combate combat combat comb combination combine combine combine combine combine combine combine comb combine comedy comestible come come comet come come come come come come comfort comfort comfort come come command commander command commando command command commemorate commemorate commemorate commence commence commend commend commentary commentator commentator comment comment comment comment comment comment comment comment commercialize commercialize commercial commercial commission commission commissioner commission commission commission commission commission commitment commit commit commit committee committee committee committe commit commit commit commodity commodity commoditize communicate communicate communicate communicate communication communique communist communist community commuter commuter commute commute compact company company company companion compaq compare compare compare compare compare compare compare compare compare compare comparison compatriot compel compel compel compel compensate compensate compensate compensation compete compete compete Compete compete compete compete Compete compete competition competitor competitor compile compile compile compile compile complain complain complain complain complaint complaint complain complain complement complement complete complete complete complete complete completion complex complexity complicate complicate complicate complicate complication comply comply compliment compliment comply comply comply component compose composer composite composition compound compound compound compound compound compound compress compressor comprise comprise comprise comprise comprise compromise compromise compromise compromise compromise compromise compulsion computation computerize computerize computerize computer-product computer-service computer computer computer computer-system compute compute compute comrade conceal conceal conceal concede concede concede concede concede concede conceive conceive conceive conceive concentrate concentrate concentrate concentrate concentrate concentrate concentration conception concept concern concern concern concern concern concern concern concern concern concerto concert concession conclude conclude conclude conclude conclude conclude conclusion concoct concoction concoct concur concur condemn condemn condemn condemn condemn condenser condition conditioner condition condominium condom condone condone condo conduct conduct conduct conduct conduct conduct conduit conduit cone conferee conferee conference confer confer confer confer confer confess confess confess confess confession confidant confide confide confide configuration confine confines confirm confirm confirm confirm confirm confirm confirm confiscate confiscate confiscate confiscate conflict conflict conflict conflict conform conform conform conform confrontation confrontation 
confront confront confront confront confront confront confuse confuse confuse confuse confuse confusion conglomerate congratulate congratulate congratulate congressman congressman conjure conjure connect connect connection connect connect connect connotation connote conquer conscript consent consent consent consent consent consequence conservationist conservationist conservative conservative conservative conserve consideration consider consider consider consider consider consider consider consider consider consign consign consist consist consist consist consist consist consist con console console consolidate consolidate consolidate consolidate consolidate consolidation consonant consort conspiracy conspirator conspire conspire conspire constituency constituent constitute constitute constitute constitute constrain constrain constraint constrain constrict constrictor construct construct construction construct construe construe construe construe consultant consultant consultation consult consult consult consume consume consumer-electronics consumer-goods consumer-product consumer consumer consume consume consummate contact contact contact contact contact contain contain container contain contain contain contain contaminate cont'd. contemplate contemplate contemplate contemplate contemplate contemplate contemporary contemporize contend contend contender contend contend contend contend contention contents content contestant contest contest contest contest contest continental contingency continue continue continue continue continue continue continue continue contraceptive contract-drill contract contract contract contract contraction contractor contractor contract contract contract contract contract contradict contradiction contradict contradict contra contrast contrast contrast contrast contrast contrast contrast contravene contribue contribute contribute contribute contribute contribute contribute contribute contribution contributor control control controller control control control control control controversy con convenant convene convene convene convene convene convene conventional-arm conventioner convention-goer convention converge conversation conversion convert convert converter convertible convert convert convert convert convert convey convey convey convey convict convict conviction convict convict convince convince convince convince convince convince convince convolute convolution convoy convulsion cookbook cook cookie cook cook cook coolant cool cool cool cool cool cool cool cooperate cooperate cooperate cooperate cooperate cooperative coordinate coordinate coordinate coordinate coor co-payment cope copy copy copier copy co-pilot cope co-president co-produce copycat copy copyright copyright copy copy copy core corkscrew corner corner cornerstone corner cornice corporate-earnings corporate corporation corporation corral correct correct correct correction correct correct correct correlate correspond correspondent correspond correspond corridor corroborate corvette cosmetic cosmetic cosmology co-sponsor co-sponsor co-sponsor costa cost cost cost cost costume costume cost cost cost cost cot cottage couch couch cough cough cough cough cough councilor council counsel counsel counselor counsel counsel count count countenance counteract counteract counterattack counterbalance counterbidder counterbid counter-claim counterclaim counter counter counter counter countermeasure counterpart counterprogram counter countersue countersue countersue countervail counter counter county count count 
country country countryman count count count count count couple couple couple couplet coup-maker coupon coupon coup courier course course court court courtesy courthouse court courtroom court court court court court cousin covenant coverage cover cover covering cover cover cover covert cover cover covet covet coward cowboy cowboy cower co-worker cow cpa crab crack crack crack crack crackle crack crack crack craft craft craft craftsman craft cram cram cramp cram crane crane crank crank crank crank crash crash crash crash crash crash crash crater crate crave crawl crawl crawl crawl creak cream cream create create Create create create create create create create creation creator creator creature credentials credit-datum credit credit credit creditor creditor credit-rating credit credit credit credit creep crematorium creep creep crest crevasse crevice crew cry crime criminalize criminal crimp crimp cringe cripple cripple cripple crisis crisis crisscross criss-cross criterion criticism criticize criticize criticize criticize criticize criticize critic critic croak croissant crony crook croon croon crop crop crop crop crop cross-breed cross cross cross cross cross-pollinate crossroads cross-shareholding cross cross crouch crouch crowd crowd crowd crowd crowd crow crown crow cr crude cruiser cruise cruise crumble crumble crumble crumble crumble crumple crumple crunch crunch crush crush crush crush cry cryptographer crystal cry cry cub cuckoo cue cuff cull culminate culminate culminate culminate culprit cultivate cultivate cultivate culture cup curator curb curb curb curb curb curb curb cure cure cure cure curl curl currency current curry curse curse curtail curtail curtail curtail curtail curtain cushion cushion cushion customer customer customize custom custom cutback cutout cut cut cutter cutting-tool cut cut cut cut cut cut cut cut cuvee cvb cycad cycad cycle cyclical cycle cyclist c-yield czar dabble dabble dabble dab daily dalliance damage damage damages damage damage damage damage damp damp dampen dampen damp damp damp dam dancer dance dance dance danger danger dangle dangle dare dare dare darling dash dash dash dash database datum datum datum datum date date date date date date daughter daunt daunt dawdle dawn dawn day. day day dazzle deactivate deadbeat deadline deadlock dead deafen dealership dealer dealer dealings deal deal dealmaker deal deal deal deal deal deal death debacle debate debate debate debate debate debenture debtholder debtor debt debunk debut debut decade decade decapitalize decease deceive deceive deceive decelerate decelerate decentralize decentralize decertify decide decide decide decide decide decide decide decide decimate decision-maker decision decision deck deckhand deck deck declaration declare declare declare declare declare declare declare declassify decline decline decliner decliner decline decline decline decline decline decline decline decontaminate decorate decorate decorator decoy decrease decrease decrease decrease decrease decrease decrease decree decribe decry decry decry dec. 
dedicate dedicate deduce deduct deductible deduct deduction deduction deduct deed deem deem de-emphasize de-emphasize deem deem deepen deepen deer deer default default defaulter default default default default defeat defeat defeat defeat defeat defeat defect defect defection defection defect defect defendant defendant defend defend defender defender defend defend defend defend defend defense-electronics defens defer defer defer deficiency deficit defy defy define define define define define define definition deflate deflate deflate deflator deflect deflect deflect deform defraud defraud defraud defraud defunct defuse defuse defy defy degenerate degenerate degenerate degree delay delay delaying delay delay delay delay delay delay delegate delegate delegate delegate delete delete delete deletion deliberate deliberate deliberation delight delight delight delight delight deli delinquency delinquent delist deliver deliver delivery delivery deliver deliver deliver deliver deliver delouse deluge deluge delve delve demagogue demand demand demand demand demand demand demand demean demeanor demilitarize demobilize demobilize democracy democratize democratize democrat demographic demographic demolish demolish demolish demolish demonize demon demonstrate demonstrate demonstrate demonstrate demonstrate demonstrate demonstration demonstration demonstrator demote demur denationalize denial deny deny deny deny denims denizen denominate denomination denounce denounce denounce denounce denounce dentist dent denuclearize denude deny deny deny depart depart depart department departure depart depart depend depend dependent depend depend depend depend depend depict depict depict depict depict depict deplete deplete deplete deplete deplore deplore deploy deploy deport depose deposit deposit deposit deposition depositor deposit deposit deposit deposit depot depreciate depredation depress depress depress depress depression depress depress deprivation deprive deprive deprive deprive deprive deprive deprogramming depths deputy deputy derail derail derail deregulate deregulate deride deride derivative derive derive derive derive derive descendant descend descend descend descent describe describe describe describe describe describe describe description desert desert desert deserve deserve deserve deserve designate designate designate designate designation design design designee designer design design design design design desire desire desire desire desist desk despair despise despise despot destabilize destabilize destination destination destine destroy destroy destroy destroy destroy destroy detach detach detail detail detail detail detain detain detain detect detect detect detective detector detect detect detergent deteriorate deteriorate deteriorate deteriorate deteriorate deteriorate determine determine determine determine determine determine determine deter deterrent deter deter deter deter detest dethrone detractor detract detract devaluation devalue devalue devastate devastate devastate develop develop develop developer developer develop develop development development develop develop develop develop deviate deviation device devil devise devise devise devise devise devote devote devotee devotee devote devote devote devour devour dewater diabetic diagnose diagnose diagnose diagnostic diagram dialect dial dial dial dial diamond diaper diary dibenzofuran dice dicker dictate dictate dictate dictate dictate dictate dictatorship dictator do do die die die die die die-hard diehard diesel die die die die die die differ 
difference difference differential differentiate differentiate differ differ differ differ difficulty digest digest digest dig digit dignify dignitary dig dig dig dig dilute dilute dilute dilute dilute dimension dime diminish diminish diminish diminish diminish diminish dim dine dine diner dine dinner dinosaur dioxin diplomat dip dip dip dip dip dip direct direct direct direction directive directory director director direct direct dirk disability disable disabled-worker disable disadvantage disagree disagree disagreement disagree disagree disagree disallow disappear disappear disappear disappear disappear disappoint disappoint disappointment disappointment disappointment disappoint disapprove disapprove disapprove disapprove disarm disarm disassemble disassociate disaster disaster disavow disband disband disband disburse disbursement discard discard discard discern discern discharge discharge discharge disciple discipline discipline discipline disclaim disclose disclose disclose disclose disclose disclosure disclosure discolor discomfit disconnect disconnect discontinue discontinue discontinue disco disco discount discount discount discount discount discount discount discourage discourage discourage discourage discourage discourage discover discover discovery discover discover discover discover discredit discredit discrepancy discrepancy discrepency discriminate disc discuss discuss discuss discuss discussion discuss discuss disdain disdain disease disembark disenchant disengage disgorge disgruntle disguise disguise disguise disgust disgust dish dish dishwasher disincline disinfectant disintegrate disintegrate disk dislike dislike dislike dislocation dismantle dismantle dismantle dismantle dismay dismember dismiss dismiss dismiss dismiss dismiss dismiss dismiss disobey disorder disparage disparage disparage disparity dispatch dispatch dispatcher dispatch dispatch dispatch dispel dispel dispense dispense dispense dispense dispersant disperse disperse displace displace display display display display display display display displease disposable disposal dispose dispose dispose dispose dispose disposition disprove dispute dispute dispute dispute dispute dispute disqualify disqualify disregard disregard disrupt disrupt disrupt disruption disrupt dissatisfy dissect dissect disseminate disseminate disseminate dissent dissent dissenter dissent dissident dissident dissipate dissipate dissipate dissociate dissociate dissolve dissolve dissolve dissolve dissuade distance distance distance distil distiller distil distinction distinguish distinguish distinguish distort distortion distort distort distort distract distract distract distraction distract distribute distribute distribute distribute distribute distribute distribute distribute distribution distributor district districts\/states disturbance disturb disturb disturb disturb dither dive diverge diverge diversife diversification diversify diversify diversify diversify diversion diver divert divert divert divert divest divest divest divestiture divest divest dive dive dive divide divide dividend divide divide divide divide divide divide dive division divorce divorce divulge divvy divvy dizzy docket dock-sider doctor doctor doctor doctor doctrine docudrama documentary document document document document document document dodge dodge do do dog dog dog do-gooder dog dog dog dog do do doldrums dole dole dole dole dollar doll dolphin dome dominate dominate dominate dominate dominate dominate donate donate donate donate donate donate donation donation do 
don don donor don don don't don doom doom doom doomsayer doom doorman door dose dossier dote doth dot dot double-cross double double double double double double double doubt doubter doubt doubt doubt doubt doubt do do do do dovetail dive down downgrade downgrade downgrade downgrade downgrade downpayment downplay downsize downsize downsize downs downturn down dozen dozen draft draft draft draftsman draft drag drag drag drag drag drag drag drain drain drain drain dramatization dram drape drape drawback drawing draw draw draw draw draw draw draw dread dream dream dream dream dream dream dream dream dream dream dress dress dress dress dress dress dress draw dry dry drift drift drift drift drill drill driller drill drill drill drink drink drink drink drip drive driver drive drive drive drive drive drive drool drool drop droplet dropout drop drop dropper drop drop drop drop drop drought drove drive drown drown drown drug-sale drug drug drugstore drum drum drum dry dry d dub dub dub dub duck duckling duck duck duck duck duct dud duel duel due due duffer dig dull dummy dump dump dump dump dump dump dump dune dupe duplicate duplicate duplicate duplication durable-goods durable dust dust duty 'd dwarf dwarf dwarf dwarf dweller dwelling dwindle dwindle dye dye die dynamics dynamo earmark earmark earmark earmark earn earn earner earnig earnings earnings earnings earn earn earn earn earn earring ear earthling earthquake earthworm ease ease ease ease ease ease easterner east east eat eater eat eat eat eat eavesdrop ebb ebb eccentric echelon echo echo echo echo echo echo echo eclair eclipse eclipse economics economy economist economist economize edge edge edge edge edge edition editorial editorial editor edit educate educate educate education educator educator effect effect effect efficiency effort effort egg ego eject eke eke elaborate elaborate elaborate elapse elbow elder elect elect elect election election election electrical-product electrify electrochemical electrode electrogalvanize electrogalvanize electromagnet electronic-datum electronics electronic-system electro-optics elect elect element element elephant elevate elevate elevation elevator eliminate eliminate eliminate eliminate eliminate eliminate eliminate eliminate elite elite elitist elongate elude elude emasculate embargo embargo embargo embark embark embark embark embarrass embarrass embarrass embarrass embassy embattle embed embed embellish embezzle embezzle emblem embody embody embody embolden embolden embrace embrace embrace embrace embrace embroil emerge emerge emergency emerge emerge emerge emerge emerge emigrate emigrate emigre emissary emission emit emote emote emotion empathize emphasize emphasize emphasize emphasize emphasize emphasize emphaticize empire employ employee employee employee employee employer employer employ employ employ employ empower empower empower empower empty empty empty empty emulate emulate emulate enable enable enable enable enable enable enact enact enact enact encapsulate encase encircle enclose enclose encompass encompass encompass encounter encounter encounter encounter encounter encourage encourage encourage encourage encourage encourage encourage encourage encourage encroach encrust encrypt encumber endangered-species endanger endanger endeavor endeavor endeavor end end end ending end end endorse endorse endorsement endorser endorse endorse endorse endorse endow endow endow end end end end end-tail endure endure endure endure endure endure end end end enemy energy energize energy-service enforce 
enforcer enforcer enforce enforce enforce enforce engage engage engagement engage engage engage engage engineer engineer engineer engineer engineer engine english engrave engulf engulf enhance enhance enhancement enhance enhance enhance enjoin enjoin enjoin enjoy enjoy enjoy enjoy enjoy enjoy enjoy enlarge enlarger enlarge enlarge enlighten enlighten enlighten enlist enlist enlist enliven ennumerate enrage enrich enrich enrol enrol enrollee enrollment enroll enroll ensconce ensemble ensnarl ensue ensue ensue ensure ensure ensure ensure entail entail entail entangle enter enter enter enterprise enter entertain entertain entertainer entertain entertain enter enter enter enthusiasm enthusiast enthusiast entice entice entice entice entity entitle entitle entitlement entitle entitle entitle entitle entomb entrance entrant entrench entrench entrepreneur entrepreneur entry entrust entrust entrust entwine envelope environmentalist environmentalist environment envisage envisage envision envision envision envision envy eon epileptic episode epitomize equal equal equal equal equal equal equate equate equate equestrian equip equip Equip equip equip equip equity equity equivalent equivalent eradicate erase erase erase erase erase erase erasure erect erect erect erode erode erode erode erode erode erode erratum err err error err err err err erupt erupt erupt erupt escalate escalate escalate escalate escalator escape escape escape escape eschew escort escort escrow espouse esp essay essential establish establish establish establish establish establish establishment establish establish establsh estimate estimate estimate estimate estimate estimate estimate estimate estimate estimate estimator estrange ethic euphemism eurobond eurodebenture eurodollar eurodollar euroissue euronote european evacuate evacuate evade evader evade evade evaluate evaluate evaluate evaluate evaluate evaluate evaluate evaluation evaluation evangelist evaporate evaporate evaporate even evening even event event even everglade evidence evil-doer evince evince eviscerate evoke evoke evoke evolve evolve evolve evolve exacerbate exacerbate exacerbate exacerbate exacerbate exaggerate exaggerate examination examine examine examiner examiner examine examine examine examine examine example example exam excavate excavate excavator exceed exceed exceed exceed exceed exceed excel excel exception except excerpt excerpt excess exchange exchange exchange exchange exchange exchange excise excise excise excite excite exclaim exclude exclude exclude exclude exclude exclude exclude exclude exclude exclusion excorciate excoriate excursion excuse excuse excuse excutive exec execute execute execute execute execute execute execute execution execution executive executive executive executor exemplify exemplify ex-employee exempt exempt exemption exempt exercise exercise exercise exercise exercise exercise exercise exerpt exert exert exert exhale exhaust exhaust exhaust exhaust exhaust exhibit exhibit exhibition exhibitor exhibit exhibit exhibit exhort exile exile exist exist exist exist exist exist exist exit exit exit exit exonerate exonerate exonerate exorcise exorcism expand expand expand expand expand expand expand expansionist expansion expectation expectation expect expect expect expect expect expect expect expect expect expect expedient expedite expedite expedite expel expel expel expend expenditure expenditure expense expense experience experience experience experience experience experience experience experience experiment experiment experiment 
experiment experiment expert expert expiration expire expire expire expire expire expire explain explain explain explain explain explain explain explain explanation explode explode explode explode explode exploit exploiter exploit exploit exploit exploit exploit explore explore explore explore explosion explosion explosive export export exporter export export export export export export expose expose expose expose expose exposure expound express express express express expression express express expunge expunge extend extend extend extend extend extend extension extension exterior extinguish extort extort extort extract extract extract extract extract extradite extradition extrapolate extra extreme extremist extricate extrusion exude exude eyeball eyeball eyebrow eye eyeglass eye eye eye eyewitness eye f16 f-18 f18 fabricate fabricate fabrication fabricator fabric facade face face face facelift face face face face facilitate facilitate facilitate facility facing face face facsimile faction factory factory factor factor factor factor factory-job fact fade fade fade fade fade fad fail fail fail failing fail fail fail failure failure fail fail faint faint fair fajita fake fake fake fall fall fall fall fall fall falsify falsify falsify falter falter falter falter falter fame familiarize family family famine fanatic fancy fang fan fan fan fan fantasy fantasize fantasize fan fare fare fare fare fare fare fare fare farmer farmer farmer farm farm farmstead farm farm farmwife fascinate fascist fashion fashion fashion fastball fasten fastener fatality fatality father father fat fatten fatten fatten fault faultline fault fault fauna favor favor favor favorite favor favor favor favor fawn fax fax fear fear fear fear fear fear fear fear feast feast feather feat feature feature feature feature feature feature feature feed feed feed feedlot feedlot feed feed feed feeler feeling feeling feel feel feel feel feel feel fee fee foot fella fell fell fellow fall fall felony felon feel feel female feminist fence fend fend fend fend ferret ferret ferry ferry ferry fertilize fertilizer fertilize fester festival festivity festoon festoon fetch fetch fetch fetch fetch fetus feud feud fiberglass fiber ficial fidget fiefdom field field field field field field fighter-bomber fighter fight fight fight fight fight fight figure figure figure figure figure figure figure figure figure filbert filch file file filer file file file file filings file filipino fill fill fill fill fill fill fill film film film film film-maker film filter filter filter filter filter finagle finalist finalize finalize finalize final finance finance finances finances finance finance financial-crime financial-service financier financing finance finding find find find find find find find fine-art fine fine fine finesse fine-tune fine finger finger fingerling fingerprint finger finger fine finish finish finish finish finish finish finish finish fireball fire fire firefighter firehoop fireman fireplace fireproof fire fire fire fire firework firing fire firm firm firm firm firm firm firm fishery fisherman fish fissure fist fit fit fit fit fit fix fix fix fix fixture fix fizz fizzle fizzle flabbergast flag flag flame flame flank flap flap flare flare flare flashback flash flash flash flash flash flashlight flash flash flat flatten flatten flatten flatten flaunt flaunt flavor flaw flaw flaw flay flea fledge flee flee fleece flee fleet fleet flee fleshpot fly flex flicker flick fly flier fly fly flight-attendant flight flight flinch fling fling flip flip 
flip flip flirt flirt flirt float float float float float float float flock flock flock flog flood flood flood flood floor flop flop floppy flora flotation flounder flounder flounder flourish flourish flourish flourish flout flow flower flower flow fly flow flow flow flow fluctuate fluctuate fluctuate fluctuate fluctuate fluctuate fluctuation fluid flunk flunk fluoropolymer flush flush fly fly fly fly foam focus focus focus focus focus focus focus foe foe fog foil foil foil foil foil fold fold folder fold fold fold folk folk folly follow follow follower follow follow follow follow follow follow foment food-fish food-service food foodstuff fool fool fool fool foothill foothill foot footnote footnote footstep foot foot foray forbid forbid forbid forbid force force force force force force force force force forecaster forecast forecast forecast forecast forecast forecast forecast forecast foreclose foreclose foreclose foreclose foreclosure foreclosure forefather foreigner foreigner forensic forerunner foresee foresee foresee foresee foresee foreshadow forest-product forest-product forest forfeiture forfeit forge forgery forget forget forget forget forget forge forging forge forgive forgive forgive forget forget forget forgo fork fork forklift fork formality formalize format form form form form form form formula formulate formulate formulate formulate formulation form form forsake fortify fortune forum forward fossil foster foster foster foster fight fight foul foundation found found found founder founder founder founder found found find find fountain four-fifth fox fraction fraction fracture fracture fragment fragment fragment frailty frame framer frame frame frame franchise franchisee franchisee franchiser franchise franchise franchise franchise franciscan franc fraternity fraud fray fray freak freak freedom free free free free freeholder free free free free freeway freezer freeze freeze freeze freighter freight french frequency frequent freshman fret fret fret fret fret friction friday fry friendship friend friend frier frieze frigate frighten frighten frighten fringe frippery fritter fritter frock frogman frog frolic frolic frond front froth freeze freeze fruit frustrate frustrate frustrate frustrate frustration fry fudge fudge fuel fuel fuel fuel fuel-service fuel fuel fugitive fujus fulfil fulfil fulfil fulfil fulfill fulfill fulmination fume fume fume fumper functionary function function function function function fundamentalist fundamental fund fund fund fund fund-raiser fundraiser fund-raiser fundraise fund fund fund fund fund fund fungus funnel funnel funnel funnel furlough furlough furnace furnish furnishings furnish furnish furrier furrow fur further further further fuss future future future gadget gag gain gain gain gainer gainer gain gain gain gain gain gain galaxy gallery gallon gallop gallstone galvanize galvanize galvanize gambler gamble gamble game gangbuster gang gangster gape garage gardener gardenette garden garden garden garment garner garner garner garner gas gas gas-gather gasoline gasp gasp gate gather gather gather gathering gather gather gather gather gauge gauge gauge give give gaze gear gear gear gear gear geek geek gemsbok gem gender generalist generalization generalization generalize generate generate generate generate generate generate generation generator gene genre gentlelady gentleman geoscience german german germ gesture gesture get get get get get-together get get get get get geyser ghetto ghostbuster ghostbuster ghost giant giant gift gilt gilt gimmick gird 
gird girl giveaway giveaway giveback give give give give giveth give give give give give give gizmo glamorize glamorize glance glare glass glaze glaze gleam glean glean glide glide glimpse glitch glitterati gloat gloater gloat gloat gloat globalist gloss gloss glove glow glow glue glue glut glut glut glycol gnaw goal goat gobble gobble goblin god go go goings-on go go goldband gold golfer golf goliath go go go gon gon goody goods goodyear gore gore gorilla gossip get get get get get get go go go govern govern govern governmental-affair government-relation government-security government-set governmentset government government governor governor govern govern govern grab grab grab grab grab grab grace grader grade grad graduate graduate graduate graduate graduate graft grain grain grain grammy gram grandchild grandee grandkid grandmaster grandmother grandparent grange grant grant grant grant grant grant grant grape grape graphic graphic graph grapple grapple grapple grasp grasp grasp grassroot gratuity gray graze grazer graze great-grandchild great greenhouse green green greet greet greeting greet greet greet grenade grow grow grow gridlock grievance grill grimace grimace grimace grinder grind grind grind gringo grin grin grin gripe gripe grip grip grip groan grocery grope gross grotto groundbreaker ground ground-handling ground grounds grind grind grind group group group group grouse Grouse grouse grovel grower grow grow grow growl grow grow grow growth growth grow grow gruel grumble grumble guarantee guarantee guarantee guarantee guarantee guarantee guarantee guarantee guard guard guard guard guard guard guard guber-peter guerrilla guess guess guess guess guest guest guide guide guideline guideline guidepost guide guide guide guilder gunboat gunman gunman gun gunner gunsling gun gun guru guru gush gush gut gut guy guy guzzle gymnastics gyrate gyrate gyrate gyration habeas habitat habit hacker hackles hack hack have have have haggle haggling haggle hail hail hail hail half-state hall hallway halogenate halt halt halt halt halt halt halt halve halve half halve halve hamburger hammer hammer hammer ham hamper hamper hamper hamper hamper hamstring hamstring hamstring handbill handbook hand-carry handcuff handcuffs hand hand handicapped handicap handicap handle handle handler handle handle handle handle handpick hand handstand hand hand hang hang hang hang hang happen happen happen happen happening happen happen happen happen harangue harangue harass harass harass harbor harbor harbor harbor harden hardship harm harm harm harm harm harm harness harp harp harp harry harvest harvest harvest hash hassle hasten hasten have have have have have hatch hatch hate hate hate hate hat haul hauler haul haul haunt haunt haunt haunt haunt haunt haven have have have have have have have have hawaius hawker hawk hawk hawk hazard hcfc hdtv headache head head head head head headlight headline headline headline headphone headquarters headrest headset head head head head heal heal health-product heal heap heap heap hear hear hear hearing hearing hear hear hear hear hearten heart hear hear heat heater heat heat heat heat heave heave heaven heave heavyweight heckle hedger hedge hedge hedge hedge hedge heebie-jeeby heed heed heed heel heighborhood heighten heighten heighten height heir hold hold helicopter help help help help help help help help help help help hemorrhage hemorrhage hemorrhoid hen hen herald herald herald herbicide hercule herd herd herniate hero heron hesitate hesitate hesitate hew hew hew hide hideout 
hider hide hide hide hide highland highlight highlight highlight highlight highlight highlight highlight high-rise high hightail hightop highway highway hike hiker hike hill hinder hinder hinder hinder hinder hinge hint hint hinterland hint hint hint hint hint hip hire hire hire hire hire hire hire hire hispanic hiss historian historical-claim historicize hitch hitch hit hit hitter hit hit hit hit hit hit hit hoard hoard hoard hobby hobble hobble hobble hobbyist hobo hoe hog hog hog hoist holder holder holding holding hold hold holdout holdover hold holdup hold hold hold hold hold hold hole hole hole holiday holler homefe homeowner homer homer homer home homicide homosexual homosexual honduran hondura hone hone honorarium honor honor honor honor honor hood hoodwink hook hook hook hook hookup hook hoof hope hope hope hope hope hope hope hope hope Hope hop hopscotch hop horizon hormone horn horoscope horrible horror horse horse horticultural-product hosanna hose hose hose hospitalization hospitalize hospital hospital hostage host hostility host host host host hot-cereal hotel-casino hotelier hotel hotline hound hound hour hour house household house house house house houseware housewife housing hover hover hover howl huckster huddle hug hug hug hulk humanities humanize human-resource human-rights human humble hum hunch hundred hundred hang hang hunker hunt hunter-gatherer hunter hunt hunt hunt hunt hurdle hurl hurl hurl hurricane hurry hurry hurry hurt hurtle hurt hurt hurt hurt hurt hurt husband husband hustler hustle hybrid hyena hype hypermarket hype hypnotize hypocrite hypothesize ice-bagger ideal idea idea identify identify identify identify identify identify identity ideology ideologue ideologue idiot idle idle idle idle ignite ignite ignite ignore ignore ignore ignore ignore ignore ignore Ignore illegality illness ill illuminate illuminate illusion illustrate illustrate illustrate illustrate illustrate illustration image imagine imagine imagine imagine imagine imagine imagine imbalance imitate imitate imitate immerse immigrant immigrate immunity impact impact impact impair impair impart impeach impede impede impede impediment impede impel impend imperative imperfection imperialist imperil impersonation implant implant implant implant implement implement implement implement implement implicate implicate implication imply imply imply implore implore imply imply imply import import import importer import import import import import import impose impose impose impose impose impose impound impound impoverish impress impress impress impressionist impress imprison imprison imprison imprison impropriety improve improve improvement improve improve improve improve improve improvise impugn impulse inaugurate incarcerate incense incentive inch inch inch inch inch incident incision incite incline include include include include include include include include include income incongruity inconsistency incorporate incorporate incorporate incorporate incorporate increase increase increase increase increase increase increase increase increase increase increase increase increase increment incriminate incumbent incur incur incur incur incur indemnify independent index indexer index index index-future index index-option indicate indicate indicate indicate indicate indicate indication indicator index indict indict indictment indict individual individual indoctrinate induce induce inducement induce induce induce indulgence indulge indulge indulge industrialist industrialize industrialize industrial 
industrial industry industry inefficiency inequality inequity infant infant infect infect infect infection inference infer infiltrate infiltrate infiltrate inflame inflate inflate inflate inflate inflate inflation-adjust inflict inflict inflict inflow influence influence influence influence influence influence influence information-service information-system inform inform inform inform inform infraction infringe infringe infringe infringe infringe infuriate infuriate infuse infuse ingest ingot ingrate ingratiate ingredient inhabit inhabit inhabit inherit inherit inherit inherit inhibit inhibit inhibit initial initial initial initiate initiate initiate initiate initiate initiatior initiative initiative inject inject inject injection inject inject inject injunction injure injure injure injury injure injustice ink inmate inning innocent innoculate innovate innovate innovation innovator i inn innuendo input inquire inquiry inquire inroad insect insert insert insert insert insert insider insider insight insinuate insist insist insist insist insist insist insist inspect inspect inspect inspection inspector inspector inspect inspect inspect inspiration inspire inspire inspire inspire inspire installation install install install installment install install instance instigate instill instinct institute institute institute institute institution institution instruct instruct instruct instruction instructor instruct instruct instrumentalist instrument instrument insulate insulate insulate insulate insulin insult insult insurance-claim insure insure insurere insurer insurer insurer insure insure insure insurgent insure integrated-technology integrate integrate integrate intellectual intend intend intend intend intend intensify intensify intensify intensify intention intent interaction intercede intercept intercept interconnect interconnect interest interest interest interest interfere interfere interfere interfere interfere interior-furnishings interior interject interlope intermediary intermix internationalist international-operation interpretation interpret interpret interpret interpret interpret interpret interrogate interrogator interrupt interrupt interruption interrupt intersection intersperse intersperse interstate intertitle intertwine intertwine interval intervene intervene intervene intervene interventionist intervention interview interview interview interview interview interview intimate intimidate intimidate intimidate intimidation intone intrigue intrigue introduce introduce introduce introduce introduce introduce introduce introduction intrude intrusion inundate invade invader invade invade invade invade invalidate invent invent invent invention inventory inventory inventor invent invent invert invest invest investigate investigate investigate investigate investigate investigate investigation investigator investigator invest invest invest investment investor-relation investor investor invest invest invest invitation invite invite invite invite invite invoice invoke invoke invoke invoke invoke involve involve involve involve involve involve involve involve ious ipo ira iris irk irk irk irk irony iron iron irradiate irregularity irritate irritate island island is isolate isolate isolate isolate isolate issue issue issuer issue issue issue issue issue issue issue be be be itemize item item jab jackal jack jack jacket jacket jackhammer jack jack jail jail jail jail jam jam jam jam jan. 
japanese-american japanese japanese jar jar jaunt jaunt jeans jeep jell jeopardize jeopardize jeopardize jeopardize jerk jetliner jet jet jettison jet jeweler jewel jew jiggle jillion jingle jinks jinx jitters job job jockey jock jog join join join join join join joint-implant joint join join join joke joke joke joke jolt jolt jolt jolt jolt jostle journalist journalist journal joust joy judge judgeship judge judge judge judge judge judge judge judgment juggler juggle juggle jug juice jumbo jump jump jump jump jump jump jump jump juncture junior junk-bond junket junk-holder junkholder junk-holder junkie junk jury jurisdiction jurist juror jury-rig justice justify justify justify justify jut jut juxtapose kayo kc-135 keen keeper keep keep keep keep keep keep keep keep ketchup keyboard key key key kickback kick kick kicker kick kick kick kick kick kiddie kid kidnap kidnap kidnapper kidnap kid kid kill kill killer killing kill kill kill kill kill kilobyte kilogram kilometer kindle kind kinfolk kingpin king kiss kiss kit knead knead knee know knight knit knit knit knock knock knock knock knock knot know know known know know know know know know knuckle kowtow krona kudos label label label Label label label label label laboratory laborer labor labor labor lab lace lack lack lackey lack lack lack lady laggard lag lag lag lagoon lag lag lag lag lag lay lay lake lambast lambaste lament lament laminate lamppost lamp land land landfill landholding landing land landlord landowner landowner landscaper landscape landslide land land land lane language languish languish languish languish languish lapse lapse lapse lap laptop laptop lap laser lash lash lash lash last last last last last last latch latch latch latch lathe laud laud laugh laugh laugh laugh laugh laugh launch launch launch launch launch launch launder launder launder launderer launder launder laurel lavish lavish lawbreaker lawmaker lawmaker lawmaker law-making lawn law lawsuit lawsuit lawyer lawyer lawyer laxative layer lay layoff layoff lay lay lay lay lbo leader leader lead lead lead lead lead lead lead lead leaf leaflet leaguer league leak leak leaker leak leak lean lean lean lean lean lean lean leap leap leapfrog leap leap leap leap leap leap learn learn learn learn learn learn learn lease lease lease lease lease lease lease lease leather leaf leave leave leave leave leave leave lecture lecture lecture lecture ledger lead lead lead leech leftist leftovers leave leave leave leave legalize legal-service legion legislate legislate legislator legislator legislature legitimize legitimize leg lemming lemon lender lender lend lend lend lend lend lengthen lengthen lengthen lengthen lengthen length lens lens lend lend leotard lesbian lesion lessen lessen lesser lesson let letter letter let let let let let let let let level level level level level level leverage leverage leverage leverage leverage levy levy liability liaison liaison liar libel liberalization liberalize liberalize liberalize liberalize liberalize liberal liberal liberate libertarian liberty librarian library louse license license licens license license license license lick lid lie lie lie lie lieutenant lie lie lifeguard life lift lift lift lift lift lift lift lift light lighten lighten lighten light light light light like like liken liken liken likes like like like limb limitation limit limit limit limit limit limit limit limit limousine limp linebacker line line liner line line lineup line line linger linger linger linger line linkage link link link link link link link link link 
lion lipoprotein lip lipstick liquefy liquefy liquefy liquefy liquidate liquidate liquidate liquidate liquidate liquid lira list list listen listen listener listener listen listen listen listen listen listing list list list list list lithograph litigant litigator litter litter light light live live live-haul live-hauler life life live live live live live live live live load load loading load load load loafer loan loan loan loan loan loan loathe loathe loathe loaf lobby lobby lobby lobby lobbyist lobby locale locality localize local locate locate locate locate locate location lock lock lock lock lock lock lock locution lodge lodge lodge lodgings log log logger log logistics logo log-roll log log log log long-term long look look lookee-loo look look look look look look look loom loom loom loom loom loom loony loophole loop loosen loosen loosen loose loot loot lop lord lord loser lose lose lose lose lose loss loss loss lose lose lose lotion lot lot lottery loudspeaker loui lounge lovebird love love lover love love love love lower lower lower lower lower lower low-life low loyalty lubricant luck lug lug lug lull lumber luminary lump lump lump lump lunch lunge lunge lung lurch lurch lurch lure lure lure lure lure lure lure lurk luxury lie lyric lyric machete machiguenga machine machine machinist machinist machinist make make make mafia mafioso magazine magazine maggot magician magistrate magnetize magnet magnify magnify magnify magnolia maharaja mail mail mailer mailing mail mailman mail-sort mail mail mainframe main maintain maintain maintain maintain maintain maintain maintain major major maker maker make make make make make make make make make make makin malefactor male malfunction malign mall mammoth manacle manage manage manage management manager manager manage manage manage manage manage mandate mandate mandate mandate mandate mandate maneuver maneuver maneuvering maneuver maneuver maneuver maneuver maneuver manhandle manifestation manifesto manifest maninstay manipulate manipulate manipulate manipulate manipulate manipulation manipulator man mannerism manners man mansion manual manual manuever manufacture manufacture manufacturer manufacturer manufacture manufacture manufacture manufacture man many many map map map map map marathon marble march march marcher march march march march margeote marginalia marginalize margin-call margin margin margin margin markdown mark mark market market marketeer marketer marketer marketing-communication market market-maker marketplace market market market market market mark markka mark mark mark mark mark marquee mar marriage marry marry marry marry marsh marvel marvel marvel mask mask mask mask mason masquerade massacre massage massage massage mass mass masseur masseuse mass-media mass-produce master masterpiece master master match match match match match match match mate materialize materialize materialize materialize materialize material material mate mathematics mate matter matter matter matter matter matter matter mature mature mature mature mature maturity maturity maul maven maximize maximize maxim mayor maze mcdonald meadow meal meander meander meaning mean means means mean mean mean mean mean mean mean measure measure measure measurement measure measure measure measure measure meat meat mechanic mechanism medallion meddle meddle media mediate mediator medical-product medicine meeting meeting meet meet meet meet meet meet meet megabyte mega-crash mega-hit mega-issue mega-merger mega-problem mega-project megaquestion mega-resort megawatt meld meld 
meld mellow melody melt melt melt membership member member memento memoirs memorabilia memorandum memorandum memorialize memory memorize memo memo mend man man mention mention mention mention mention mention mentor menu mercantilist mercedes-benz mercedes merchandise merchandiser merchandise merchant merchant merge merge merger merge merge merge meringue merit merit merit mesh message messenger mess messr. mess metabolize metal metal metal metal-worker metalworker metaphor mete meter methodology method mete metric meet meet mouse mouse micoprocessor microbe microchip microcomputer microeconomic microelectronics microphone microprocessor microwave mid-1940 mid-1960 mid-1970 mid-1980 mid-1990 middleman midsize miff miff mig-29 mighta migrate migration mile milestone military-electronics militate militia milk milk milk mill millionaire million-plus million million mill mimic mimic mimic mimic mince mind mind mind mind minefield mineral miner mine mine mingle miniaturize minicar minicomputer minimill minimize minimize minimize minimum mine miniseries minister ministry minisupercomputer minivan minneapoli minority minor mint mint mint minus minus minute minutiae mips mips mire mirror mirror mirror mirror misadventure miscalculate miscalculate miscarriage misclassify miscreant misdeed misdemeanor misfortune misguide mishandle mishandle misinterpret misinterpret misjudge misjudgment mislay mislead mislead mislead mismeasurement misperception misplace misquote misrepresentation misrepresent misrepresent misrepresent misrepresent misroute miss miss miss missile miss missionary mission misspend misstate misstate misstatement misstate miss miss mistake mistake mistake mistreat mistress mistrial mist misunderstanding misunderstand misunderstand misuse mite mitigate mitigate mitsubishus mitsuus mix mix mix mixer mix mix mixture mix moan moan moan mobilize mobilize mobilize mobilize mock mock model model model model model modem moderate moderate moderate moderate moderate modernize modernize modernize modernize mode modification modification modify modify modify modulate moisturizer mold mold molecule mollify mollify moment monday monetarist moneymaker monitor monitor monitor monitor monitor monitor monitor monitor monkey monolith monologue monopoly monopolize monopolize monopolize monopolize month month moonie moonlight moon mop mop moral mores morning morsel mortgage mortgage mortgage moslem motel mother mother motif motion motion motivate motivate motivate motivate motive motorcycle motorist motorize motor mound mountain mount mount mount mount mount mount mourn mourn mousetrap mouth mouth move move move movement move move move move move move move move movie move move mow muck muddy muddle muffle muff mull mull mull multimedia multinational multiple multiple multiply multiply multiply multiply mumble mummy munch municipality municipal municipal municipal muni muni mural murder murderer murder murder murmur muscle muscle muscle muscovite muse muse museum museum muse mushroom mushroom mushroom musician muster mutate mutate mutation mute mute mutilate mutiny mutter mutt muzzle be mystery myth nab nagging nag nag nail nail nail name-dropper name-drop name name name nameplate name name name name name name narcotic narrative narrow narrow narrow narrow narrow narrow nationalist nationalize nationalize national nation native natural-food natural-resource navy navigate naysayer naysay nazi neanderthal near near near-monopoly near necessitate necessitate necessity neck necktie need need need need need need 
need need need negate negative neglect neglect neglect negotiate negotiate negotiate negotiate negotiate negotiate negotiation negotiation negotiator negotiator neighbhorhood neighborhood neighbor neighbor neighbour neophyte nerd nerd nerve nestle nest net net net net net net network network network network neurologist neutralize neutralize neutron newborn newcast newcomer newscast newsy newsletter news newspaper newspaper newsprint newsstand newsstand news-weekly nibble niche nichola nick nickname nickname nightclub nightmare night nine-month nine-tenth nix nobleman nod no-load nominate nominate nominate nomination nominee non-client non-communist nonconformist non-economist non-lawyer non-lawyer nonoperate nonperformer nonperform nonperform nonrecurr non-seaman nonstop noodle normalize norm norm northrop nose-dive nosedive nose-dive nosedive nose no. notch notch notebook note note noteholder note note note note note note note note notice notice notice notice notice notice notification notify notify notify notify notify notify note note notion no. novel novelty novitiate nov. nozzle nuance nuclear-arm nudge nullify nullify nullify number-cruncher number number number number nurse nursery nurse nurse nurture nurture nurture nurture nut oak oasis oats obey obfuscate object object object objection objection objective object object object obligate obligate obligation obligation oblige oblige oblige obliterate obscure obscure obscure observation observe observe observer observer observe observe observe observe observe obsess obsolete obsolete obstacle obstruct obstruct obstruct obtain obtain obtain obtain obtain obviate occasion occasion occupation occupy occupy occupy occupy occupy occur occur occurrence occur occur occur occur ocean octave octogenarian oddball oddity oddity odds odds offender offend offend offend offensive offer offer offer offer offering offer offer offer offer offer offer offer off-hour offical officer officer office office office-supplies official official official offus offset offset offset offset offset offset offset offshoot offspring ogle ogle oils oils old old-timer olefin olympics omen omission omit omit omit omit omit oncogene oncogene one onlooker onlooker on-ramp ooze ooze open open openend opener opening open open open open open opera operate operate operate operate operate operate operate operate operation operative operator opine opinion-maker opinion opinion opponent opponent opportunist opportunity oppose oppose oppose oppose oppose oppose oppose opt opt optical-product optimist opt option option option option opt opt orange orchardist orchard orchestra orchestrate orchestrate orchestrate orchid ordain order order order order order order order order ordinance organism organization organization organize organize organize organizer organize organize organize organ orient originate originate originate originate originate origination originator origin orkem ornament orphan orphan other other ounce oust oust oust oust oust outage outbid outbid outbid outbreak outcome outdate outdo outdistance outdo outfielder outfit outfit outflank outflow outflow outfly outgain outgrow outgrow outing outlander outlast outlast outlaw outlaw outlaw outlay outlay outleap outlet outline outline outline outline outline outlook outmode outnumber out-of-stater outpace outpace outpace outpace outpace outpace outperform outperform outperform outperform outperform outperform outpost outrage outrank outsell outsell outsell outshine outshine outsider outskirts out-smart outsell outstrip 
outstrip outstrip outstrip outstrip out-trade outweigh outweigh outweigh outweigh oven over-allotment overalls overarch overbid overbid overbought overburden overcome overcharge overcollateralize overcome overcome overcome overcome overcommit overdo overdo overdose overdose overemphasize overflow overhang overhaul overhaul overhaul overheate overheate overlay overlap overlap overlap overlay overlook overlook overlook overlook overlook overlook over-magazine overpay overpay overpay overpay overplant overpower overprice overpurchase overreact overreact overreact overreact overreact override override override overrule overrule overrule overrule overrun oversee oversee oversee oversee overseer oversee oversee overshadow overshadow overshadow oversimplify oversell oversell overstate overstate overstate overstate overstrain oversubscribe overtake overtax overthrow overthrow overthrow overture overturn overturn overturn overturn overuse overvalue overvalue overweight overwhelm overwhelm overwhelm overwhelm overwhelm overwork owe owe owe owe owe owe own own owner owner own own own own own own pace pacemaker pace pacify packaged-goods packaged-goods package package package package package package pack pack packet pack pack pack pack pack pac pac pact paddle paean page pay pay pay pay painewebber pain paint paint painter painting painting paint paint paint paint pair pair pair palazzo pale pale pale pale palm palmtop palmtop palm pal pamper pamphlet pancake pander panelist panel pang panic panic panic panic panjandrum pan pan pan pantage panties pants pan paper-goods paper paper-product papers papers parachute parachute parade parakeet parallel parallel parallel paralyze paralyze paramedic parameter paraphernalia paraphrase parasite parastatal parcel parcel parcel parch pardon pare pare parent parent pare pariba parimutuel pare parish parishioner parity park park park park park park parlor parry parry partake part participant participant participate participate participate participate participate participate participation particulars party party party part partisan partisan partnership partnership partner partner partner part part part pasha passage pass pass pass passenger-kilometer passenger passer-by pass pass pass passion passport pass pass password paste pastel pasteurize pastime pastor patch patch patent patent patent path patient patient patrol patrol patronize patronize patronize patron pattern pattern pattern pause pause pause pause pause pause pave pave pave pave paw pawn pawn payable paycheck payer payer pay pay payment payment payment payoff payout payout payroll pay pay pay pay pay pay pcb pc peacemaker peach peak peak peak peak peak peal peal peanut pearl pear peasant peasant pea peccadillo peck peck peculiarity pedal pedal pedal peddle peddle peddle peddle peddle pedestrian pedigree peek peel peer peer peer peer peer peg peg peg peg peg peg pellet penalize penalize penalize penalty penny pencil pencil pencil pencil pend pend pend penetrate penetrate penetrate penis pen penny pension pen people people people people pepper pepper pepper pepsi perceive perceive perceive perceive percentage perception perch perfect performance perform perform performer performing-art perform perform perform perform perform peril periodical period period peripheral perishable perish perk perk perk permeate permeate permit permit permit permit permit permit permit perpetrate perpetuate perpetuate perpetuate perpetuate persecute persecute persist persist persist persist persist personality personalize 
personalize personnel personnel person persuade persuade persuade persuade persuade persuade pertain perturb peruse peruse pervade pervade perversity pesata peseta peso pessimist pester pesticide petition petition petition petrochemical pet pet pharaoh pharmaceutical pharmaceutical pharmacy pharmacist phase phase phase phase phase phenomenon phillip philosopher philosophy phobia phone phone phone phone phone phone photocopier photocopy photocopy photofinisher photograph photographer photograph photograph photograph photo phrase physician physics piano piaster pick pick picker pick pickin pickle pick pick pickup pick pick pick picture picture picture picture picture picture piece piece piece piece pierce pier pie piggyback piggyback piglet pigment pig pile pile pile pile pile piling pile pile pillar pillory pillory pillowcase pillow pill pilot pilot pimp pinch pinch pinch pinch pine ping ping pin pin pin-point pinpoint pinpoint pin pin pint pin pioneer pioneer pioneer pipe pipe pipeline pipe pirate pirate piroghi pistil pistol piston pitch pitch pitcher pitch pitch pitch pitchman pitch pitch pitfall pitfall pit pit pit pit pit pit pivot pizzas-with-everything pizzeria placate placate place place placement place place place place place place plague plague plague plague plainclothes plain plain plaintiff plaintiff plane planet plank plan plan planner planner plan plan plan plan plan plan plan plantation plant plant plant plant plant plant plan plan plastic plastic plate platform platitude plaudit play play player player playground play play playoff play play play play play plead plead pleading plead plead pleasantry please please please please please please please plea pleasure plea pledge pledge pledge pledge pledge pliers ply plight plod plot plot plotter plot plot plow plow plow plow ploy ploy pluck pluck plug plug plug plug plug plummet plummet plummet plummet plummet plunge plunge plunge plunge plunge plunge plunge plunk plus plus ply poacher poach pocket pocket pocket pocket pocket pockmark point point pointer point point point point point poise poison poison poke poke poke polarize pole pole police police police police policy policy police policyholder policy-maker policy-make polish polish polish polish politician politician politicize politico-plaintiff politics politics politics poll poll pollen-produce pollinate pollinate pollinate pollinate poll poll pollster poll pollutant polluter pollute pollute poll pol poltergeist polymer polyol polyp polyrhythm ponder ponder ponder pond pony pony pontificate pony pool pool pool pool pop pop popularize popularize popularize populate populate populate population pop pop porcelain porch pore pore pore pork-barreler portable portend portend portfolio portfolio port portion portrait portrayal portray portray portray portray portray portray port port pose pose pose pose pose pose position position position position position possess possess possess possess possession possess possess possibility postcard post post post post poster posting post postmark postmark postpone postpone postpone postpone postpone post post post posture post potable potato potentate potentiality pothole pot pot pouch pounce pound pound pound pound pour pour pour pour pour pour powder power powerhouse power power practice practice practice practice practice practitioner pragmatist prairie praise praise praise praise praise praise praise prance prayer pray preach preach preach pre-approve preapprove prearrange precaution precede precedent precede precede precede precinct 
precious-metal precious-metal precipice precipitate precipitate preclude preclude preclude predate predator predecessor predetermine predicate predict\/advocate predict predict predict predict prediction prediction predict predict predict predispose pre-empt pre-empt preference prefer prefer prefer prefer prefer prefer prefer prejudice prejudice premiere premiere premiere premiere premise premium preoccupy prepay prepay preparation preparative prepare prepare preparer prepare prepare prepare prepare prepay prepayment prepayment prepay prep pre-register pre-register prerogative presage presage preschooler prescribe prescribe prescribe prescribe prescription presentation present present presenter present present present present present present preserve preserve preserve preserve preserve preside preside president president preside preside pre-sign press press press press press pressure pressure pressure pressure pressure pressure pressure press press press presume presume presume pretend pretend pretend pretension pre-test pre-try prevail prevail prevail prevail prevail prevail prevent prevent prevent prevent prevent prevent prevent prevent preview preview prey price price price-earnings price\/earnings price price price price price price pricing price prick priest prime primitive prince principal principle print print printer print print printout print print print print priority prisoner prison privatize privatize privatize privilege prize prize probability probe probe probe probe probe problematic problem procedure proceed proceed proceedings proceedings proceed proceeds proceeds proceed proceed proceed process process process process process process processor process process proclaim proclaim proclaim proclaim proclaim proclamation procure prod prod prod produce produce producer producer produce produce produce produce produce production product product prod profess profess profess professional professional profession professor profess proffer proffer profferr profile profile profile profit profit profiteer profiteer profit profit-sharing profit profit profit profit profit-taking profitt profit profit progenitor prognosticator program programmer program program program program program progress progress progress progress progression progressive progress prohibit prohibit prohibit prohibition prohibit prohibit prohibit project project project project project projection projector project project project project project proliferate proliferate proliferate prolong prolong promise promise promise promise promise promise promise promise promote promote promoter promote promote promote promote promotion prompt prompt prompt prompt prompt prompt promulgate prong pronounce pronounce pronouncement pronounce proof-of-purchase proofread propagandist propagandize propagandize propel propel propel propel property proponent proponent proportion proposal proposal proposal propose propose propose propose propose propose proposition prop prop prop proprietorship proprietor propse prop prop proscribe proscribe prosecute prosecute prosecute prosecute prosecution prosecutor prosecutor prosecutor pro pro prospects prospects prospects prospectus prosper prosper prostitute protect protect protect protection protector protect protect protect protege protein protein protest protest protester protest protestor protest protest protest protocol prototype prove prove prove proverb prove prove prove prove provide provide provide provider provide provide provide provide provide provide province prove provision provision 
provoke provoke provoke provoke proxy prune prune pseudo-lobbyist psychic psychologist psychologist publication publicize publicize public-relation public-works public-works publish publish publish publisher publisher publish publish publish pub puffer pull-back pullback pull pull pull pullout pull pull pull pull pull pulverize pummel pummel pummel pump pump pump pump pump pump punch punch puncher punch punch punch punch pundit punish punish punish pun punt pupil puppet puppy purchase purchase purchaser purchase purchase purchase purchase purchase purchase purge purge purge purge purge purist pur-poise purport purport purpose purr purse-snatching purse pursue pursue pursuer pursue pursue pursue pursue pursuit push push pusher push push push push push push put put put put put put put put put put put put put puzzle puzzle puzzle puzzle pyramid pyramid quack quack quadruped quadruple quadruple quadruple quadruple quake qualification qualify qualify qualify qualify qualify qualify quality qualm quantify quantify quantity quarrel quarrel quarterback quarter quartet quash quash quash queer quell query query query question question question question question question question question question queue queue quibble quicken quiet quiet quiet quiet quip quip quip quip quirk quit quit quit quit quit quit quiver quiz quota-cheater quota quotation quote quote quote quote quote quote quote quote race racehorse race racetrack race race rack rack racketeer racket rack rack radar-elude radical radio radio rafter rage rage rage rage rage raid raid raider raid raid raid railbike railcar railing railroad rail rail railway rain rain rain raise raise raiser raise raise raise raise raise raise raise rake rake rally rally rally rally rally rally rally rally rally ramble ramification ram rampart ramp ramp rancher ranch rand range range ranger range range range range range ring rank rank ranking rank rankle rank rank rank rank run rape rape rapeseed rape rapist raptor rarefy ratchet rate rate rate ratepayer rate rate rate rate rate rate ratify ratify ratify ratify rating rating rate rationalization rationalize rationalize ration ratio ratio rat rattle rattle rattle rattle rattle rat ravage ravages ravages rave rave ravine raw-material ray raze raze reach reach reach reach reach reach reach reach reach react react react reaction reactivate reactivate reactor react react react reader reader ready reading read read readmit read read read read read read read read reaffirm reaffirm reaffirm reaffirm reaganaut realestate realign realign realignment realign realist reality realize realize realize realize realize realize reallocate reallocate realm ream reap reap reap reappoint reapportion reappraise reappraise reappraise reap reap reard rear rear rearm rearrange rearrange reason reason reason reason reason reason reason reassert reassert reassert reassess reassess reassign reassign reassignment reassume reassurance reassure reassure reassure reassure reauthorize reawaken rebate rebel rebel rebound rebound rebound rebound rebound rebound rebound rebind rebuff rebuff rebuild rebuild rebuild rebuild rebuke rebut rebut rebut recalculate recalculate recalculation recall recall recall recall recall recall recall recall recall recant recant recapitalization recapitalize recapture recede recede receipt receivable receive receive receiver receive receive receive receive recentralize receptionist receptor recess recession recharge recipe recipient recite recite reckon reckon reckon reckon reckon reclaim reclaim reclaim reclaim 
reclaim reclassify recline recognize recognize recognize recognize recognize recognize recommendation recommendaton recommend recommend recommend recommend recommend recommend reconcile reconcile reconcile reconnect reconsider reconsider reconstruct reconstruct reconstruct reconstruct record record recorder recording record record record record record record recount recount recount recount recoup recoup recoup recover recover recovery recover recover recover recover recover recraft re-creaction recreate re-create re-creation recruit recruit recruit recruit recruit recruit recruit rectangle rectify rectify recuperate recur recuse recycle recycle recycle recycle redden redeem redeem redeem redefine redefine redefine redemption redeploy redesign redesign redesign redesign redevelop red-flag redial redirect rediscover redistribute redistribute redline redo redouble redound redo redraw redress red red reduce reduce reduce reduce reduce reduce reduce reduction reef re-elect re-elect reel reel reel re-emerge re-emphasize re-enact re-enactment re-enactment re-enter re-enter re-enter re-establish re-establish reestablish re-evaluate re-evaluate re-evaluate re-examine reexamine re-export refashion referee reference referral refer refer refer refer refer refer refer refile refinance refinance refinance refinance refine refinery refiner refiner refine refine refit reflect reflect reflect reflect reflect reflect reflect refocus refocus refocus refocus refocus reform reformer reform reform reformulate reform refrain refrain refresh refrigerator refuel refugee refund refund refund refund refund refurbish refurbish refurbish refuse refuse refuser refuse refuse refuse refuse refute refute regain regain regain regain regain regain regain regard regard regard regard regard regard regard regard regenerate region register register register register register register registrant registration regret regret regret regret regret regret regroup regroup regulate regulate regulate regulate regulation regulation regulator regulator regulator regumm rehabilitate rehabilitate rehash reign reign reignite reignite reignite reignite reimburse reimburse reimbursement reimburse reimburse reimburse reimpose reincorporate reincorporate reindict reinforce reinforce reinforcement reinforce reinforce reinforce reinforce reinforce rein rein reinstall reinstate reinstate reinstate reinstate reinstitute reinsurer reintegrate reintroduce rein reinvent reinvent reinvest reinvest reinvest reinvest reinvest reinvigorate reinvigorate reinvigorate reiterate reiterate reiterate reit reject reject reject rejection reject reject reject rejoice rejoin rejoin rejoin rejoin rejuvenate rekindle rekindle rekindle rekindle relabel relate relate relate relate relate relate relate relationship relation relation relative relaunch relaunch relax relax relax relax relax relay release release release release release release release release relegate relent relent relent relic rely rely rely rely relieve relieve relieve religion relinquish relinquish relinquish relinquish relish relish relish relive relocate relocate relocate relocate relocation rely rely rely rely remake remain remain remain remain remains remains remain remain remain remake remand remark remark remarketer remarketing remark remark remark remedy remedy remedy remember remember remember remember remember remember remember remic remic remind remind reminder remind remind remind remind remittance remnant remodel remodel remora remove remove remove remove remove remove remunerate rename 
rename rename render render rendering render render rendezvous renege renege renegotiate renegotiate renegotiate renewal renew renew renew renew renew renew renounce renounce renounce renovate renovate renovate renown rental rent renter rent rent rent rent rent reoffer reopen reopen reopen reopen reopen reorganize reorganize reorganize reorient repackage repackage repackage repay repay repaint repair repair repair repair repair repair repair reparation repass repatriate repay repayment repay repeal repeal repeal repeat repeat repeater repeat repeat repeat repeat repel repel repercussion replace replace replacement replace replace replace replace replace replaster replay replenish replenish replicate replicate replicate reply reply reply reply reply reply repond report report reporter report report report report report report report report report repose reposition repository repossess representation representative representative represent represent represent representive represent represent represent repress repress reprice reprint reprint reprint reprint reprisal reproduce reproduce reproduce reprove rep republican republic repudiate repurchase repurchase repurchase repurchase repurchase repurchase repurchase reputation repute request request request request request request require require requirement require require require require require requisition reroute reroute rerun resale reschedule reschedule reschedule rescind rescind rescind rescission rescue rescuer rescue rescue research researcher researcher researcher research research research reseller resell resell resell resell resemblance resemble resemble resemble resemble resent resent resent reservation reserve reserve reserve reserve reserve reserve reserve reserve reserve reservoir reset reshape reshape reshape reshape reshuffle reshuffle reshuffling reshuffle reside residence resident resident reside reside reside residue resignation resignation resign resign resign resign resign resin resist resist resist resist resist resist resist resell resell resell resolution resolve resolve resolve resolve resonate resonate resonate resort resort resort resort resource respect respect respects respect respect respond respond respondent respond respond respond respond respond response response responsibility restart restart restarter restart restart restate restate restate restate restaurant restaurant rest restore restore restore restore restrain restrain restrain restraint restrain restrict restrict restrict restriction restrict restrict restrict restrict restructure restructure restructure restructure restructure restructuring restructure rest rest rest rest rest restyle resubmit result result result result result result result result result resume resume resume resume resume resume resume re-supply resurface resurface resurge resurrect resurrect resurrect resurrect resurrect resuscitate resuscitate retailer retailer retail retail-sale retail retail retail retain retain retain retain retain retain retake retaliate retardant retard rethink rethink retire retire retire retiree retirement retire retire retire retire retool retool retort retort retrace retract retrain retreat retreat retreat retreat retreat retrench retrieve retrieve retrieve retrieve retrofit retry return return return return return return return return reunion reunite reunite reuse revalue revamp revamp revamp revamp be reveal reveal reveal reveal reveal reveal reveal revelation reveler revel revel revel revenue revenue reverberate reverberate reverberate reverberation 
reversal reverse reverse reverse reverse reverse reverse reverse revert revert review review review review review review review review revise revise revise revise revise revise revise revisionist revision revisit revisit revisit revitalize revitalize revival revival revive revive revive revive revive revoke revoke revoke revolutionary revolutionize revolutionize revolve revolve revolve rev reward reward reward reward reward reward reward rework rewrite rewrite rewrite rhyme rhyme rhyme ribby ribbon rib rican riches rider ride ride ride ridge ridicule ridicule ride rid rid rid rid rid riff rifle rig rig right rights rights rights right-to-lifer right-winger rigor rig rile rile rim ringer ringer ring ring ring ring ring riot ripen ripen ripoff rip rip ripple ripple ripple rise rise rise rise rise rise rise risk risk risk risk risk risk risk rite ritual rival rivalry rival rival rival rival river rivet rivet rivet rivet roadblock road road roadway roam roam roar roar rob robbery robber robber rob robe robot rock rock rocker rocket rocket rocket rock rock rock rodent ride ride rod rogue roil roil role rollback roll roll roll roller roll rollover roll roll roll roll romance romanticize romp romp roofer roof rooftop roommate room roost root rooter root root root root rope rosarian rose rise rise rotate rotate rotate rot rot rough roughneck round round round round round roustabout route route route routine route row row row royalty rub rubber-neck rubber-stamp rubdown rubfest rubin ruble rub rub rub rub ruffle ruffle rug ruin ruin ruin ruin ruin ruin rule rule ruler rule rule rule rule rule rule ruling rule rumble rumble rumble rumbling rumble ruminate ruminate rumination rumor rumor rumor rumor rumor ring run-in runner runner-up run run run run runup run run run run runway rupture rupture rupture rush rush rush rush rush rush rust rusticate rustler rustling rv saatchus saber sabotage sack sacking sack sack sacrifice sacrifice sacrifice sacrifice saddle saddle safeguard safeguard safeguard safeguard safety sage sag sag sag sag sago say say say say say sail sail sailor sail saint salary salary salaryman salesman sale sale sale salespeople salespeople salicylate salt salute salute salvage salvage salve samaritan samovar sample sample sanction sanction sanction sanction sandinista sand sandwich sandwich sandwich sandwich sing sanitationist sanitize sanitize sink san sap sap sap satellite satisfy satisfy satisfy satisfy satisfy satisfy satisfy satisfy saturate saturate saturate sit sit saucer sauce sauna save save savers\/investors saver save save save save savings savings save savor savor savor savor see say say say say say say say say scab scalawag scale scale scale scale scale scalp scam scammer scamper scam scandalize scandal scanner scan scan scan scan scape scare scare scare scare scare scare scarf scare scare scar scar scatter scavenger scenario scenario scene scent schedule schedule schedule schedule schedule schemer scheme scheme schmumper scholarship scholar schoolboy schoolchildren schoolmate school school schoolteacher school science scientist scientist scime scime scoff scoff scoff scold scold scoop scoop scoop scoop scoop scoot score score score score score score scorn scorn scotch scotch scourge scour scour scout scout scowl scowl scramble scramble scramble scramble scramble scrape scrap scrap scrap scrap scrap scrap scrap scrap scratch scratch scratch scratch scream scream scream scream scream screech screech screen screening screen screen screen screen screenwriter screw screw screw 
scribble scribbler scribble scribe scrimp scrimp script scriptwriter scrounge scrounge scrubber scrutinize scrutinize scrutinize scrutinize sculptor sculpture scurry scurry scurry scuttle scuttle scuttle sealant seal seal seal seal seal seaman search search search search search search sear sear sea seasoning season seat seat seat seat seat secede second-guess second-guess seconds seconds secretary secret section sector secure secure secure secure secure securite security security sedan seduce seduce seed seed see see seeker seek seek seek seek seek seek seek seem seem seem seem seem seem see see seep seesaw see see seethe see see see see segment segment segregate segregate seize seize seize seize seize seize seizure select select select selection selection select select select self-destruct self-insure self-reinsure self-starter seller sell sell sell-off sell-off selloff sell sell sell sell sell semantics semester semi-celebrity semiconductor semifinish semifinish seminar senator senator sender send send send send send senior senior sense sens sense sense sensibility sense sensitive sensitivity sensitize sen. sensor sentence sentence sentence sentence sentencing sentence sentence sentiment send send separate separate separate separate separate sequel sequester sequester sequester sequin sergeant serial series series servant serve serve serve server serve serve serve service service service service service service serve session setback set set setter setting set set settle settle settlement settlement settler settle settle settle settle settle set set set set sever sever sever sever sevice sewer sew sex shack shades shadow shadow shadow shag shake shake shake shake shake shake shake shape shape shape shape shape shape shard sharecropper share share shareholder shareholder shareholding share share share share share share share shark sharpen sharpen sharpen shatter shatter shatter shatter shave shave shave shave shave shear sheath shed shed shed shed shed shed sheet sheik shell shell shell shell shelter shelter shelter shelter shelve shelf shepherd sheriff shy shy shield shield shield shield shield shift shift shift shift shift shift shift shilling shill shimmer shine shine shine shine shin shipbuilder shipment shipment ship ship shipper shipper ship shipset ship ship ship shipyard shirk shirk shirt shiver shiver shock shock shock shock shock shoehorn shoe-horn shoelace shoemake shoe shake shake shooting shoot shoot shoot shoot shoot shopkeeper shop shop shopper shopper shopper shop shop shop shop shop shore shore shore shear shear shortage shortchange short-circuit shortcoming short shorten shorten shorten short short short-seller shorts short shot shoot shoot shoulder shoulder shoulder shoulder shout shout shout shout shout shove shovel shove shove shove showcase show show shower shower showgirl showing show show show showroom showroom show show-stopper show show show show show shrink shred shriek shrine shrink shrink shrink shrink shrivel shroud shrub shrub shrug shrug shrug shrug shrink shudder shuffle shuffle shun shun shun shun shun shutdown shut shut shutter shutter shut shuttle shuttle shuttle shuttle shut shut shut shy shy shy sibling side side sideline sideline sideline side side sidestep sidestep sidestep sidestep sidestep sidetrack side side sidewalk sift sift sift sigh sigh sigh sigh sighting sight signal signal SIGNAL signal signal signal signal signal signal signal signatory signature signboard sign sign sign signify signify signify sign sign sign sign sign silence silence 
silence silence silt similarity simmer simmer simplicity simplify simplify simplify simplify simplify simulate simulate simulation simulator singer sing singin single single singles single single single sing sing sing sink sink sink sin siphon siphon siphon siphon sip sip siren sister sitcom site sit sit sit sit situate situation sit sit sit six-pack sixty sixty size size size sizzle sizzle skateboard skeptic skeptic sketch sketch sketch skew skid skid skid skid skid skid skid skier sky ski skill skill skimmer skimp skim skin skip skipper skip skip skip skip skirmish skirmish skirt skirt skirt ski ski skr1.5 skr205 skr20 skr225 skr29 skull skyrocket skyrocket skyrocket slab slacken slacken slacken slacks slack slay slam-dunk slam slam slap slap slap slap slap slash slash slash slash slash slash slate slate slate slat slaughter slaying slay sleep sleep sleep sleep sleep sleep sleeve sleep slice slice slice slide-pack slide slide slide slide slide slide slide slim slim slinger sling slip slip slip slip slip slip slither slither slit sliver slogan slog slog slope slope slosh slot slough slowdown slow slow slow slow slow slow s&ls slump slump slump slump slump slump slum slur smack smack smart smash smash smash smash smell smell smell smell smell smidgin smile smile smile smile smile smile smoke smoker smoker smokescreen smoke smoke smoke smoke smolder smolder smooth smooth smother smother smother smuggle snafus snag snag snake snake snake snap snap snap snapshot snap snap snare snarl snatch snatch snatch sneak sneaker sneak sneak sniff sniff sniff sniff snipe snippet snivel ' snoop snooze snore snort snowball snowball snowbird snub snub soak soak soap soapsud soar soar soar soar soar soar soar sober sob socall social-affair socialist socialist socialize socialize society sociologist sock sock sock soda sofa soft-drink soften soften soften soften soften softie soil soil-nutrient soil soiree soldier soldier sell sell solicitation solicit solicit solicit solicitor solicit solicit solidify solidify solidify solution solve solve solve solvent solve solve solve solve song songster songwriter son soothe soothe sophisticate sop sorehead sort sort sort sort sort seek seek soulmate soul sound sound sounding sound sound sound sound sound sound sound soup source source source sour sour sour soviet soviet sow sow sow sow sow soybean soybean soybean spaceship space spackle spaghetti span span span span spare spare spare spare spare spare spare spark spark spark sparkplug spark spark spark spark spar spar spasm spa spawn spawn spawn spawn speaker speaker speak speak speak speak speak spearhead spearhead spearhead specialist specialist specialize specialize specialize specialize specialize special specialty specialty-chemical specialty-metal species specification specification specifics specify specify specify specify specify specimen spec spectator speculate speculate speculate speculate speculate speculation speculator speculator speed speed speech speed speed speed speed speed speed spell spell spell spell spell spender spend spend spend spend spendthrift spend spend spend spend spend spew spew spice spider spy spy spy spigot spike spill spill spill spill spill spin spinoff spin spin spiral spiral spiral spirit spirit spirit splash splint splits splits split split split split spoil spoil speak spokesman spokesman spoke spokesperson speak sponsor sponsor sponsor sponsor sponsor sponsor sponsor sponsor spook spook spook spook spook spoonbill spoonful spore sport sporting-goods sport sportsman sport sport 
sport spotlight spot spot spot spot spot spot spot spot spot spouse spout spring sprawl spray spray spread spreadsheet spread spread spread spread spread spread spread spring spring spring sprinkle sprinkler sprinkle sprinkle spritzer sprout sprout sprout spruce spruce spring spud spin spin spurn spurn spurn spurn spurn spurn spur spur spur spur spur spurt spurt spurt spurt spurt spur sputter sputter spy spy squabble squad squall squander squander square square square square square squat squeak squeegee squeeze squeeze squeeze squeeze squeeze squeeze squelch squelch squint squint squirm stab stab stab stabilize stabilize stabilize stabilize stabilize stabilize stabilize stack stack stack stack stadium stadium staff staffer staffer staff staff staff stage stage stage stage stage stage stage stagewhisper stagger stagger stage stagnate stagnate staid stain stain staircase stair stake stake stake stalk stalk stall stall stall stall stall stall stall stalwart stampede stampede stamping stamp stamp stamp stanch standardize standard standby stand stand stand stand stand stand stand stand staple stare stare stare stare star star star start start start starter start start startle start start start start-up start-up start start star starve starve starve starve stash stash state state statement statement statesman state state state state state state state station station statistician statistics statistics statue statute staunch stave stay stay stay stay stay stay stay steady steady steak steal steal steal steal steam steam steam steelmaker steelmaker steel steelworker steer steer steer steer steer stem stem stem stem stem stem step step step step step step step step step step stereo stereotype sterile sterilize sterilize sterilize steroid steward stew sticker stick stick stick stick stick stick stifle stifle stifle still-rage stilt stimulate stimulate stimulate stimulator stimulus sting stingray stink stint stipend stipulate stipulate stipulate stir stirring stir stirrup stir stir stir stir stitch stitch stockbroker stockbroker stockbuild stock stockholder stockholder stockholding stock-index-future stock-index stock stock-option stockpile stockpile stock stock stock stock stock stockyard stoke stoke stoke steal steal stomach stomach stomp stomp stone stone stonewall stand stand stooge stool stoppage stop stop stop stop stop stop stop stop store store storefront store store store store store story store storm storm storm storyteller stow straddle strafe straighten straighten strain strainer strain strain strain strain strait strand strand strand strangle strangle strap strap stratagem strategy strategy strategist strategist strawberry stray stray stray streak stream stream streamline streamline streamline stream street streetspeak strengthen strengthen strengthen strengthen strengthen strengthen strength stress stress stress stress stress stressor stress stress stretch stretch stretch stretch stretch stretch stretch stretch strew stricken stride striker strike strike strike strike strike strike strike string string stripe strip strip strip strip strip strip strip strive strive strive strive stride stroke stroke stroke stroke stroll stroll stroll stronghold strive strike strike strike structure structure structure structure structure struggle struggle struggle struggle struggle struggle struggle stub stick stick stud student-athlete studentle student student student study study study study study studio studio study study study stuff stuff stuff stuff stumble stumble stumble stumble stumble sting sting 
stun stun stun stunt style style style stymie subcommittee subcompact subconference subcontractor subcontractor subcontract subdue subgroup subject subject subject subject subject sublet submarine sub-market submit submit submit submit submit submit subordinate subordinate subordinate subordinate subordinate subpoena subpoena subpoena subscribe subscriber subscriber subscribe subscribe subscribe subscribe subscribe subscription sub-segment subside subside subside subsidiary subsidy subsidy subsidize subsidize subsidize subsidize subsidize subskill substance substantiate substation substitute substitute substitute substitute substitute substitute substract subsume subtilis subtitle subtract subtract subtract subtract sub-underwriter sub-underwrite suburb subversive subvert subvert subvert subway succeed succeed succeed succeed succeed succeed succeed success successor succumb succumb succumb sucker suck sue sue sue sue suffer suffer suffer suffer suffer suffer suffer suffice suffice suffice suggest suggest suggest suggestion suggest suggest suggest sue suit suite suitor suitor suit suit suit suit summary summarize summarize summarize summarize sum summer summon summon summon summon sum sum sum sunday sunflower sunglass sing sink sink sunset supercede supercede supercomputer superconcentrate superconcentrate superconductor superconductor superimpose superintendent superior supermarket supermarket superpower superpremium supersede supersede supersede superstar supervise supervise supervise supervise supervise supervise supervisor supplement supplement supply supply supplier supplier supplies supply supply supply supply support support supporter supporter support support support support support support suppose suppose suppose suppose suppose suppressant suppress suppress suppress surface surface surface surface surface surface surfer surge surge surge surge surge surge surge surmount surpass surpass surpass surpass surpass surplus surprise surprise surprise surprise surprise surprise surrender surrender surrender surrender surrender surround surround surround surround surround surtax survey survey survey survey survey survey survey survey survive survive survive survive survive survive survive survive survive survivor suspect suspect suspect suspect suspect suspect suspect suspend suspend suspend suspend suspension suspicion sustain sustain sustain sustain sustain suture suvivor be s be swallow swallow swallow swamp swamp swamp swan swap swap swap swap swap swarm swathe sway sway sway sway swear swear swear sweat sweater sweat sweatshirt sweat sweat sweat swede sweeper sweep sweep sweepstakes sweep sweep sweeten sweeten sweetener sweeten sweet swell swell swell swell swell swell swell sweep sweep swerve swim swim swindle swine swing swing swing swing swing switch switch switcher switch switch switch switch switch switch swivel Swivel swear swear swing swing swing sycophant symbolize symbolize symbol sympathy sympathizer sympathize symposium symptom sym synchronize synchronize synchronize syndciate syndicate syndicate syndicate syndicate syndicate syndication synergy syngery synonym synthesizer synthesize synthetic system system tabac table tablespoon tablet tabloid taboo tab tack tack tackle tackle tackle tackle tackle taco tactic tag tag tag tail tailor tailor tail taint take take takeover taker take take taketh take take take take takings take take talent tale tale talk talk talk talk talk talk talk talk talk talk tally tally tally tame tame tamper tamper tamper tampon tandy tangle tangle 
tango tank tanker tanker tank tank tank tan tan tantalize tape tape Tape taper taper taper taper tape tapestry tape tape taping tape tap tap tap tap tap tap tap target target target target target target target target tariff tarnish tarnish tarnish tar tartan task tassel taste taste taste taste taste teach teach taunt tax-deduction tax tax tax tax tax tax-exempt tax-exempt taxpayer taxpayer taxpayer tax-reduce tax tax-writer t-bill teacher teach teach teach teach teach team team teammate team team team tear tear tear tease teaspoon technical-service technician technique technocrat technology teem teem teen-ager teenager teens teens teeter tooth telecine telecommunications telecommunications telecuss telegraph telegraph telemarketer telephone telephone-operation telephone telephone telephone telesystem telesystem televise television telex teller tell tell tell tell tell temblor temperature temper temp tempt tempt tempt tempt tempt tenant tend tend tendency tender tender tender tender tender tender tender tend tend tend tend tenet tension ten tenth term term terminal terminal terminate terminate terminate terminate termination term term term terrify terrify territory terrorist testament test-drive test-drive test test tester test-fire testify testify testify testify testify testify test test test test test test test tether textbook textile text thank thank thanks thanks thanks thank thank thank that theater theft theft theme theme theologian theory theorist theorist theorize theory-teach therapy therapist thermometer the the thief thief thing thing think think think think think think thin thin third thirty thirty thistle thoroughbred thought think think thousand thousand thrash thrash thrash thread threaten threaten threaten threaten threaten threaten threat three-fourth three-quarter three-seventh throw thrift thrift thrill thrill thrill thrive thrive thrive thrive thrive thrive throat thrower throw throw throw throw throw throw throw thrust thrust thrust thrust thug thumb thumb thumb thumb thunder thwart thwart thwart thwart tick ticket ticket ticket tick tick tick tidbit tide tie tie tie-in tie tie tie-up tie tiger tighten tighten tighten tighten tighten tile tilt tilt tilt timberland timber time time time-hotel time-share time time time time timpani tinge tinge tinker tinker tinker tin tip tip tipster tiptoe tiptoe tiptoe tip tire tire-kicker tire tire tissue titan title title title title toast toddler toehold toe toil toiletries toil toil toil tell tell tolerate toll toll tomato tone tone tongue tonnage ton ton take tool toot topic top top top top topple topple topple top top top top torch torch tear tory tormentor torment torment tornado tear torpedo torpedo tort torture torture torture toss toss tosser toss toss total total total total total total total total total tote tote tote totter totter touch touch touch touch touch touch touch toughen toughen tough tour tour tourist tournament tour tour tour tout tout tout tout tout towel tower tower tower townhouse township town tow toy toy trace trace trace trace trace trace track track track track track track track tractor tract trade trade trade trademark trade-off tradeoff trader trader trade trade trade trade trade trade trade traditionalist tradition traduce traduce trafficker tragedy trail trail trailer trail trail trail trail trail train train trainer train train train train train train traipse trait tramp trample trample transact transact transaction transaction transact transcribe transcript transfer transfer transfer transfer 
transfer transfer transform transform transform transform transform transfusion transistor translate translate translate translate translate translation transmission transmit transmit transmit transmit transmogrify transmogrify transplant transplant transplant transplant transport transport transport transport transport transport transport transport transvestite trap trappings trap trap trash trash trauma traumatize traumatize travail travel travel traveler traveler travel Travel travelogue travels travel travel travel travel tray treadmill tread tread treasurer treasure treasure treasury treasury treat treat treat treat treatise treatment treat treat treat treat treble tree trek tremble tremor trench trend trend-setter trend trend trespass trespass trial triangle tribe tribute trickle trickle trickle trick trick try try try try trigger trigger trigger trigger trigger trigger trigger trillion trill trimester trim trim trim trim trim trim triple triple triple triple triple trip trip triumph trivialize trivia troops troops tro trot trot trot trouble trouble trouble troublemaker trouble trouble trouble trouble trough trough troupe trousers trout trucker truck-part truck truck truck trudge trump trumpet trumpet trumpet trundle trunk trust trust trustee trustee trust trust trust trust trust trust truth try try tryout try try try try t-shirt t-shirt tube tub tuck tuck tuck tuck tug tug tuition tuition tumble tumble tumble tumble tumble tumble tumor tumor-suppressor tune tune tune tune tune tunnel turban turbine turboprop turmoil turnaround turn turn turn turn turn-on turn turn turn turn turn turn turtle tusk tutor tutorial tutor tuxedo tv tweezers twenty twiddle twin twist twist twist twist twist twitch two-hundredth two-seventh two-third twothird two-third tycoon tie type typeface type typewriter typhoon typify typify ufo ulcer ultimatum umbrella un-advertiser unban unblock uncertainty unchlorinate uncle unconsolidate unconsolidate uncover uncover uncover uncover underclass undercut undercut undercut undercut undercut underestimate underestimate underfund undergird undergo undergo undergo undergo underlie underline underline underlie underlie undermine undermine undermine undermine undermine underperform underperformer underperform underperform underperform underpin underpin underpin underprice underreact underscore underscore underscore underscore underscore underscore underscore undersell understaff understand\/adopt understand understand understand understand understate understate understate understate understand understand undertake undertake undertaking undertake undertone undertake underutilize undervalue undervalue underweight undergo underwhelm underwiter underwriter underwriter underwrite underwrite underwrite underwriting underwrite underwrite underwrite underwrite undo undo undo undulate undulate unearth unexecute unfaze unfocus unfold unfold unfold unfold unhinge unhock unhusk unify uniform unify unify unify unionist unionize union union unite Unite unite unite unitholder unitholder unit unit university university unknown unleash unleash unleash unleash unleash unleash unload unload unload unload unload unlock unlock unlock unmask unmask unmaterialize unnerve unnerve unplug unpolarize unravel unravel unravel unravel unroll unroll unseat unseat unsettle unsettle unveil unveil unveil unveil unveil unveil unwaver unwind unwind update update update update upgrade upgrade upgrade upgrade upgrade upgrade upheaval uphold uphold uphold uphold uphold uphold up up uproot ups-and-downs upset 
upset upset upset upset upset up uptick ural urge urge urge urge urge urge urging urge use use Use user user use use use use use usher usher usher usher usher use Use usurp u.s. utility utility utilize utmost utopian utterance utter utter uvb vacancy vacancy vacate vacate vacate vacate vacationer vacation vacation vaccine vacillate vacuum vagabond vagary validate valuation value value value value value value value value valve vandalize vanish vanish vanish vanish vanish vanish vanity van vapor variable variation vary vary vary variety vary vary vary vary vase vassal vault vault vcr veer veer vegetable vegetable vegetarian vehicle veil veil vend vendor vent ventilate ventilate venture venture venture vent venue verdict verge verify verify version vessel vest vestment vest veteran veterinarian veto veto veto veto veto have have vex viaduct vibrate vicar vice vicissitude vicitim victimize victim victim victory victory videocassette videodisk video videotape videotape vietnamese view view viewer viewer viewing view viewpoint view view view view view vignette villager village village villain vindicate vineyard vintage vinyl-product violate violate violate violate violate violate violation virgin virtue virtuoso visage visionary vision visit visit visit visit visitor visitor visit visit visit visit visualize visualize visual vitiate voice voice voice voice voice voice voice voice void void volume volunteer volunteer volunteer volunteer vomit vote vote vote-getter voter voter vote vote vote vote vote voucher vow vow vowel vowel vow vow vow vie waddle wade wad wafer waffle waffle waft wage wages wage wage wagon wag wail wail wait wait waiter wait wait wait wait wait waive waive waiver waiver waive waive waive wake wake walk walkie-talkie walk walk walk walkout walk walk walk walk walk walk wallcovering wallet wallop wallow wall wall wander wander wander wander wane wane wane wane wane wane wane want want want want want want want ward warden ward warehouse wares warhead warm warm warm warm warm warn warn warn warn warner warning warn warn warn warn warrant warranty warrant warrant warrant warrant warren war warrior war war war wart war wash wash wash wash wash waste waste waste waste waste waste be be be watchdog watch watch watcher watch watch watch watch watch watch watch water waterfall water water water waterworks watt wave wavelength waver waver wave wave wax wax way way weaken weaken weaken weaken weaken weaken weaken weaken weakness wean weapon wear wear wear wear wear wear weasle weather weather weave weave web wed wedding wedge wedge wedge wednesday wed wed weed weekday weekend weekly weeknight week weeper weep weigh weigh weigh weigh weigh weight weighting weight weight weigh weigh welcome welcome welcome welcome welcome welcome welcome weld well well-state well-wisher go go weep be be be be we whack whack whack whale wheelbase wheel wheel wheeze when-issue while whimper whim whip whipping whip whipsaw whipsaw whip whip whirlwind whir whisk whisper whisper whisper whistle whistle whistle whistle whites whitewash whittle whizz wholesaler wholesaler wholesale whoop whoosh widen widen widen widen widen widen widen widget widow widow wield wield wield wield wiggle wiggle wiggle wig wilfr willie will will will wimp wimp windfall wind window windshield wind wind wind winery wine wing wink winner winner win win win win winter win win wipe wipe wipe wipe wipe wire wire wiretap wire wisecrack wish wish wish wish wish wish wish-list wish wish witch withdrawal withdraw withdraw withdraw withdraw 
wither wither withhold withhold withholding withhold withhold withhold withhold withstand withstand withstand withstand witness witness witness witness witness wife wife wizard woe wake wake wolf womanize woman woman wonderbar wonder wonder wonder wonder wonder wonder won win win win woodchuck wood-product wood woo woo woo word word-processing word wear workbook workday work work worker worker worker workings work work work workman worksheet worksheet work workstation work work work work work world-affair world worm wear wear worry worry worry worrier worry worry worry worry worry worry worsen worsen worsen worsen wound wound wind wind wind weave wow wrack wrack wrack wrangle wrap wrap wrapper wrap wrap wrap wreak wreak wreak wreck wreck wreck wrench wrench wrest wrestler wrestle wrestle wrestle wrest wriggle wring wrist write-downs writedown write-off writeoff writer\/producers writer write write write write writhe writings write write write write wrong write write work wring x-ray yacht yank yank yank yank yard yearbook yearling year year year yell yell yellow yell yell yelp yen yield yield yield yield yield yield yield yield youngster younker youth yuppie zapper zap zero zero zero zero zigzag zig-zag zip zip zloty zombie zone zone zone zoom zoom zoom ================================================ FILE: ccgbank/data/wsj_0595Corrected.auto ================================================ ID=wsj_0595.1 PARSER=GOLD NUMPARSE=1 ( ( () ) ( ( () () ) ( () ( () ( ( () ) ( () ( () ) ) ) ) ) ) ) ID=wsj_0595.2 PARSER=GOLD NUMPARSE=1 ( ( ( () ( ( () ) ( ( () () ) ( ( () () ) ) ) ) ) ( () ( () ( () ( () ( () ( () ( ( () ) ( ( () ( ( () ( () () ) ) ( ( () () ) ( () ( () () ) ) ) ) ) ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.3 PARSER=GOLD NUMPARSE=1 ( ( ( ( () ( () ( () ( () ( () ( () ( () () ) ) ) ) ) ) ) ) ( () ( ( () ( () () ) ) ( () ( ( ( () () ) ) ( () ( ( ( ( ( ( () () ) () ) () ) ) ( () ( () ) ) ) ( () ( ( () () ) ( () ( ( () ( () () ) ) ) ) ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.4 PARSER=GOLD NUMPARSE=1 ( ( ( () () ) ( () ( ( ( () ( () () ) ) ( () ( () ( ( () ( () () ) ) ) ) ) ) ( () ( ( () ( () () ) ) ( ( ( () ) () ) ) ) ) ) ) ) () ) ID=wsj_0595.5 PARSER=GOLD NUMPARSE=1 ( ( ( () () ) ( () ( ( () ) ( () ( ( () ( () ( () () ) ) ) ( () ( () ( ( ( ( () () ) () ) () ) ( () ( ( ( ( ( () () ) () ) ) ( () ( () ( () ( () ( () ( () () ) ) ) ) ) ) ) ( () ( () ( ( ( () () ) ) ( () ( ( () ) ( () ( ( ( () ( () ) ) ) ( () ( ( ( () () ) ) ( () ( ( () ( () () ) ) ) ) ) ) ) ) ) ) ) ) ) ) ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.6 PARSER=GOLD NUMPARSE=1 ( ( () ( () ( ( () ) ( () ( ( () () ) ) ) ) ) ) ( ( ( () ( () ) ) ( () ( ( () ) ( () ( () ) ) ) ) ) () ) ) ID=wsj_0595.7 PARSER=GOLD NUMPARSE=1 ( ( () ( ( () () ) ( () ( () ( ( () ( ( ( ( () ) () ) ( () () ) ) ( ( () ( ( ( () () ) () ) () ) ) () ) ) ) ( () ( ( ( ( () () ) () ) ( () () ) ) ( () ( ( () ( ( () ( ( ( () () ) () ) () ) ) ( () ( () ( () ( () () ) ) ) ) ) ) ( () ( () ( ( () ( ( ( () () ) () ) () ) ) ( () () ) ) ) ) ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.8 PARSER=GOLD NUMPARSE=1 ( ( ( () () ) ( ( () ( () () ) ) ( () ( ( ( () ( () () ) ) () ) ) ) ) ) () ) ID=wsj_0595.9 PARSER=GOLD NUMPARSE=1 ( ( ( () ( () () ) ) ( () ( ( () ) ( ( () () ) ( ( ( ( ( () () ) () ) () ) ) ( () ( () ( ( () ) ( () ( ( () ( () ( () () ) ) ) ) ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.10 PARSER=GOLD NUMPARSE=1 ( ( () ( ( ( () () ) ( () ( ( ( () () ) () ) ) ) ) ( () ( ( ( ( ( () () ) () ) () ) ) ( () ( () ( () ( ( () () ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.11 PARSER=GOLD NUMPARSE=1 ( ( () ( ( ( () () ) ( () ( 
( ( ( ( () () ) ) ) () ) () ) ) ) ( () ( ( ( () ) ( () ( ( () () ) ( () ( ( () () ) ) ) ) ) ) ( () ( () ( () ( () ( () ( () ( () ( () () ) ) ) ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.13 PARSER=GOLD NUMPARSE=1 ( ( ( () ( () () ) ) ) ( () ( () ( () ( ( () () ) ) ) ) ) ) ID=wsj_0595.14 PARSER=GOLD NUMPARSE=1 ( ( ( ( ( ( () () ) ( () ( () ( () () ) ) ) ) ) ( ( () () ) ( () ( ( () () ) () ) ) ) ) ( () ( ( ( () ( () () ) ) ) () ) ) ) () ) ID=wsj_0595.16 PARSER=GOLD NUMPARSE=1 ( ( ( ( () () ) ) ( ( () () ) ( () ( () ( ( ( ( () ( () ( () ( () () ) ) ) ) ) ( () ( () ( () ( () ( () () ) ) ) ) ) ) ( () ( () ( () ( ( ( () () ) ( () ( () ) ) ) ( () ( () ( () ( ( () () ) ) ) ) ) ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.17 PARSER=GOLD NUMPARSE=1 ( ( () ( ( ( ( () () ) ) ( () ( ( ( ( () ( () ( () ( () () ) ) ) ) ) ( () ( () ( () () ) ) ) ) ( () ( ( ( () () ) ) ( () ( () ( () () ) ) ) ) ) ) ) ) ( () ( () ( ( ( ( () ( ( () () ) () ) ) ( ( () ( ( ( ( () () ) () ) () ) ) ) () ) ) ( () ( () ) ) ) ( ( ( () () ) ( () ( ( () () ) ) ) ) ( () ( ( ( ( () () ) ( () ( ( () () ) ) ) ) ( () ( () ( () ( () ( () () ) ) ) ) ) ) ( () ( () ( () ( () ( () () ) ) ) ) ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.18 PARSER=GOLD NUMPARSE=1 ( () ( ( () () ) ( ( ( ( ( ( () () ) ( () ( () ) ) ) ( () ( () ( () ( () ( () () ) ) ) ) ) ) ( () ( ( () ( ( () () ) () ) ) ( () ( ( () () ) () ) ) ) ) ) () ) () ) ) ) ID=wsj_0595.19 PARSER=GOLD NUMPARSE=1 ( ( () ( ( ( () ( ( () () ) () ) ) ( ( () ( ( () () ) ) ) () ) ) ( ( () ( ( () () ) ) ) ( () ( ( () () ) ( () ( () ( () ( ( () () ) () ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.20 PARSER=GOLD NUMPARSE=1 ( ( ( ( () () ) ) ( ( ( () ( () ( () ( () ( () () ) ) ) ) ) () ) ( () ( ( () () ) ( () ( ( () () ) ( () ( ( () ) ( () ( ( ( () () ) ) ( () ( () ( () () ) ) ) ) ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.21 PARSER=GOLD NUMPARSE=1 ( ( ( () () ) ( () ( () ( () ( ( ( ( () () ) () ) ) ( ( () ( () ( () ( () ( () ( () () ) ) ) ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.22 PARSER=GOLD NUMPARSE=1 ( ( ( () ( () ( () ( () ( () () ) ) ) ) ) ( ( ( ( () () ) () ) () ) ( () ( ( ( ( () ( () ( () () ) ) ) ) ( () ( () ( ( ( () () ) () ) ) ) ) ) ( () ( () ( ( ( () ( () ( () () ) ) ) ) ( ( () ( () () ) ) ( () ( ( () ( ( () () ) () ) ) ( () ( ( () () ) ) ) ) ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.23 PARSER=GOLD NUMPARSE=1 ( ( () ( ( () ( ( ( () ) () ) () ) ) ( ( () ( () ( () ( () ( () ( () ( () () ) ) ) ) ) ) ) ( () ( ( () () ) ( () ( () ( ( () ( () () ) ) ( () ( ( ( () () ) ( ( () () ) ) ) ( () ( ( () () ) ( () ( ( () ) ( () ( ( () () ) ) ) ) ) ) ) ) ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.24 PARSER=GOLD NUMPARSE=1 ( ( ( () ( () () ) ) ) ( () ( ( () () ) ) ) ) ID=wsj_0595.25 PARSER=GOLD NUMPARSE=1 ( ( ( ( () ( () ( () ( () ( () ( () () ) ) ) ) ) ) ( ( ( () ( ( () () ) ) ) ( () ( ( ( ( () () ) ) () ) () ) ) ) ) ) ( () ( ( ( () ( () ( () ( () ( ( () ( () () ) ) ) ) ) ) ) () ) ( () ( () ( ( () ) ( () ( ( () ( () ( () ( () () ) ) ) ) ( () ( ( () () ) ( () ( () ) ) ) ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.26 PARSER=GOLD NUMPARSE=1 ( ( ( ( () ( () () ) ) ) ( () ( () ( () ( ( () ( () () ) ) ( () ( () ( () ( ( () () ) ( () () ) ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.27 PARSER=GOLD NUMPARSE=1 ( ( ( ( ( () ) () ) ( ( () () ) ( () () ) ) ) ( ( ( () ( () ( () () ) ) ) () ) ( ( ( () () ) ( () ( () () ) ) ) ( () ( ( () () ) ) ) ) ) ) () ) ID=wsj_0595.28 PARSER=GOLD NUMPARSE=1 ( ( () ( () ( ( () ( ( () ( () ( () () ) ) ) ) ) ( () ( () ( ( () () ) ( () ( ( () ( ( ( () ) ( () ( () ) ) ) ( () () ) ) ) ( () ( () ( ( ( () () ) ) ( () ( ( ( () ( () ( () () ) ) ) () ) ) ) ) ) ) ) ) ) ) ) ) ) ) 
() ) ID=wsj_0595.29 PARSER=GOLD NUMPARSE=1 ( ( ( ( () ) ( () ( ( () ( () () ) ) ( () ( () ( () ( () ( () ( () ( () ( () ( () ( () () ) ) ) ) ) ) ) ) ) ) ) ) ) ( () ( () ( ( ( ( () ( () () ) ) ) ( () ( () ( ( () ( () () ) ) ( () () ) ) ) ) ) ( () ( ( ( ( () () ) () ) ( () ( ( () ( () () ) ) ) ) ) ( () ( () ( ( ( () ( ( () ( () () ) ) ( () () ) ) ) ( () ( ( ( () ) () ) () ) ) ) ( () ( () ( ( () () ) ( () ( () () ) ) ) ) ) ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.30 PARSER=GOLD NUMPARSE=1 ( ( () ( ( () () ) ( ( ( () () ) ( () ( () () ) ) ) ( () ( ( () ( () ( () () ) ) ) ( () ( () ( () ( () ( () () ) ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.31 PARSER=GOLD NUMPARSE=1 ( ( ( () ( () ) ) ( () ( ( ( ( () () ) ) ( () ( ( () ( ( () ( () () ) ) ( () () ) ) ) ( () ( () ( () ( () () ) ) ) ) ) ) ) ( () ( ( () ( () ( () () ) ) ) ( ( ( () ( () ) ) ( () ( ( () ( () ( ( () () ) ) ) ) ( () ( () ( () ( ( () () ) ) ) ) ) ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.32 PARSER=GOLD NUMPARSE=1 ( ( () ( () ( () ( ( ( ( ( () () ) ) ( () ( () ( () ( () () ) ) ) ) ) ( () ( () ( () ( () ( () () ) ) ) ) ) ) ( () ( ( ( () () ) ) ( () ( () ( () ( () ( () () ) ) ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.33 PARSER=GOLD NUMPARSE=1 ( ( ( ( () ( () ( () ( ( () ( () () ) ) ( () ( () ( () ( () ( ( () ) ( ( () () ) ( () ( ( () ( () ( () ) ) ) ( () ( () ) ) ) ) ) ) ) ) ) ) ) ) ) ) ) ( () ( ( ( ( () () ) ) ( () ( () ( () () ) ) ) ) ( ( () () ) ( () ( () ( ( ( ( ( () () ) () ) ) ( () ( ( () ( () ( () () ) ) ) ) ) ) ( () ( () ( () () ) ) ) ) ) ) ) ) ) ) () ) ID=wsj_0595.34 PARSER=GOLD NUMPARSE=1 ( ( () ( () () ) ) ) ID=wsj_0595.35 PARSER=GOLD NUMPARSE=1 ( ( ( ( ( ( ( () ( () () ) ) ( () ( () () ) ) ) ) ( () ( ( ( () () ) ( () ( () ( () ( () ) ) ) ) ) ( () ( ( () () ) ) ) ) ) ) ( () ( ( ( () () ) ( () ( ( () () ) ) ) ) () ) ) ) () ) () ) ID=wsj_0595.36 PARSER=GOLD NUMPARSE=1 ( ( ( ( ( () () ) ) ( () ( ( () ( () ( () () ) ) ) ( () ( () ( ( () () ) ( () ( ( () () ) ) ) ) ) ) ) ) ) ( () ( ( () ( () ( () () ) ) ) () ) ) ) () ) ID=wsj_0595.37 PARSER=GOLD NUMPARSE=1 ( ( () ( () ( ( ( () () ) ( () ( ( ( () () ) ) ( () ( ( () () ) ( () ( () ( () () ) ) ) ) ) ) ) ) ( () ( ( ( ( () ( () ( ( () () ) ) ) ) ( () ( () ( () ( () () ) ) ) ) ) () ) ( ( () ( () ( () () ) ) ) ( () ( () ( ( () ( ( ( ( () () ) () ) ) ( () ( () ( () () ) ) ) ) ) ( () ( ( ( () () ) ) ( () ( () ) ) ) ) ) ) ) ) ) ) ) ) ) () ) ================================================ FILE: ccgbank/extract/add-chunks.xsl ================================================ ================================================ FILE: ccgbank/extract/convert-to-graph.xsl ================================================ ================================================ FILE: ccgbank/extract/convert-to-hlds.xsl ================================================ Error: node with id = should be a reference (with idref) ================================================ FILE: ccgbank/extract/grammar.xml ================================================ ================================================ FILE: ccgbank/extract/raise-nodes.xsl ================================================ Next ================================================ FILE: ccgbank/models/hypertagger/ht-prior.flm ================================================ ## A prior probability model that estimates p(supertag | word, pos) ## with smoothed back-off (a "soft tagging dictionary" if you will). 1 ## lexical category ("supertag") (T) given POS tag (P) and word (W). 
T : 2 P(0) W(0) t_p0w0.count t_p0w0.lm 3 P0,W0 W0 wbdiscount gtmin 15 P0 P0 wbdiscount 0 0 wbdiscount ================================================ FILE: ccgbank/models/hypertagger/ht.config ================================================ # location of FLM file and vocab file for prior model #priorModel=ht-prior.flm #priorModelVocab=vocab.st # maxent model (trained using ZL's toolkit) for hypertagging maxentModel=ht.mod # beam width for beta-best search through the tags returned by the maxent model betas = 0.075 0.03 0.01 0.003 0.001 0.0003 0.0001 0.00001 # if using tagging dictionaries (instead of prior models) specify the dictionary threshold # ("K" value from Clark 2002) dictk=10 # specify tagging dictionaries. these are only used if prior models are NOT specified! #wDict=word.dict.min10 #posDict=pos.dict.min10 # filename for configuration of POS tagger posConfig=pos.config # arg names and short names argnames = Arg0:A0 Arg1:A1 Arg1a:A1a Arg1b:A1b Arg2:A2 Arg2a:A2a Arg2b:A2b Arg3:A3 Arg4:A4 Arg5:A5 ================================================ FILE: ccgbank/models/hypertagger/ht2.config ================================================ # location of FLM file and vocab file for prior model #priorModel=stprior.flm #priorModelVocab=vocab.st # maxent model (trained using ZL's toolkit) for hypertagging maxentModel=ht.mod # second-pass model maxentModel2=ht2.mod # beam width for beta-best search through the tags returned by the maxent model # these will be applied to both hypertagging models betas = 0.075 0.03 0.01 0.003 0.001 0.0003 0.0001 0.00001 # if using tagging dictionaries (instead of prior models) specify the dictionary threshold # ("K" value from Clark 2002) #dictk=10 # specify tagging dictionaries. these are only used if prior models are NOT specified! #wDict=word.dict.min10 #posDict=pos.dict.min10 # filename for configuration of POS tagger posConfig=pos.config # arg names and short names argnames = Arg0:A0 Arg1:A1 Arg1a:A1a Arg1b:A1b Arg2:A2 Arg2a:A2a Arg2b:A2b Arg3:A3 Arg4:A4 Arg5:A5 ================================================ FILE: ccgbank/models/hypertagger/ht2.train.config ================================================ # config file for generating events during realizer training # # a single beta level (not the most strict one) is used, rather # than adaptive backoff (todo: try reverse adaptation) # maxent model (trained using ZL's toolkit) for hypertagging maxentModel=ht.mod # second-pass model maxentModel2=ht2.mod # beam width for beta-best search through the tags returned by the maxent model # these will be applied to both hypertagging models betas = 0.001 # filename for configuration of POS tagger posConfig=pos.config ================================================ FILE: ccgbank/models/hypertagger/pos.config ================================================ # this model gives priors on POS tags. #priorModel=posprior.flm #priorModelVocab=vocab.pos # this is a Zhang Le-style MEM. maxentModel=pos.mod # you can also configure the tagger's beta-value here using the key "beta" ================================================ FILE: ccgbank/models/hypertagger/posprior.flm ================================================ ## A prior probability model that estimates p(pos | word) ## with smoothed back-off (a "soft tagging dictionary" if you will). 1 ## POS tag (P) given word (W) with a back-off to the prior on the POS itself. 
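The `betas` lines in ht.config and ht2.config above configure a beta-best beam over the tag distribution the maxent model returns for each word: a tag survives only if its probability is within a factor beta of the most probable tag, and the listed beta values are tried strictest-first, loosening the beam only when the previous pass fails downstream. A minimal sketch of that pruning rule follows; the function names, the dictionary-shaped per-word distributions, and the `accepts` callback are illustrative assumptions, not OpenCCG's actual API.

def beta_best(tag_probs, beta):
    # Keep every tag whose probability is within a factor beta of the most
    # probable tag; beta=1 reduces to single-best tagging.
    best = max(tag_probs.values())
    return [tag for tag, p in tag_probs.items() if p >= beta * best]

def multitag(per_word_probs, betas, accepts):
    # Betas are tried strictest-first (the largest value keeps the fewest tags);
    # the beam is loosened only when the downstream consumer rejects the result.
    assignment = []
    for beta in betas:
        assignment = [beta_best(probs, beta) for probs in per_word_probs]
        if accepts(assignment):
            break
    return assignment

Under this rule the lists above, which run from 0.075 down to 0.00001, move from aggressive pruning toward keeping nearly the whole tag distribution.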
P : 1 W(0) p_w0.count p_w0.lm 2 W0 W0 wbdiscount gtmin 1 0 0 wbdiscount gtmin 1 ================================================ FILE: ccgbank/models/hypertagger/vocab.flm ================================================ ## flm file for determining the vocab 3 ## word (W) unigram W : 0 w.count w.lm 1 0 0 ## supertag (T) unigram T : 0 t.count t.lm 1 0 0 ## pos tag (P) unigram P : 0 p.count p.lm 1 0 0 ================================================ FILE: ccgbank/models/parser/binary.flm ================================================ ## binary step of Hockenmaier's HWDep generative syntactic model ## with added pos tags 6 ## expansion (E) given parent cat (P), lexcat parent (CP), head postag parent (T) and headword parent (W) E : 4 P(0) CP(0) T(0) W(0) e_p0cp0t0w0.count e_p0cp0t0w0.lm 5 P0,CP0,T0,W0 W0 wbdiscount gtmin 10 P0,CP0,T0 T0 wbdiscount P0,CP0 CP0 wbdiscount P0 P0 wbdiscount 0 0 wbdiscount ## head (H) given expansion (E), parent cat (P) and lexcat parent (CP) H : 3 E(0) P(0) CP(0) h_e0p0cp0.count h_e0p0cp0.lm 4 E0,P0,CP0 CP0 wbdiscount E0,P0 P0 wbdiscount E0 E0 wbdiscount 0 0 wbdiscount ## sibling (S) given expansion (E), parent cat (P), head cat (H), lexcat parent (CP), head postag parent and headword parent (W) S : 6 E(0) P(0) H(0) CP(0) T(0) W(0) s_e0p0h0cp0t0w0.count s_e0p0h0cp0t0w0.lm 7 E0,P0,H0,CP0,T0,W0 W0 wbdiscount gtmin 10 E0,P0,H0,CP0,T0 T0 wbdiscount E0,P0,H0,CP0 CP0 wbdiscount E0,P0,H0 H0 wbdiscount E0,P0 P0 wbdiscount E0 E0 wbdiscount 0 0 wbdiscount ## lexcat sibling (CS) given expansion (E), sibling (S), parent cat (P) and head cat (H) CS : 4 E(0) S(0) P(0) H(0) cs_e0s0p0h0.count cs_e0s0p0h0.lm 5 E0,S0,P0,H0 H0 wbdiscount E0,S0,P0 P0 wbdiscount E0,S0 S0 wbdiscount E0 E0 wbdiscount 0 0 wbdiscount ## head postag sibling (TS) given lexcat sibling (CS), sibling (S), parent cat (P), head cat (H), head postag parent (T) and headword parent (W) TS : 6 CS(0) S(0) P(0) H(0) T(0) W(0) ts_cs0s0p0h0t0w0.count ts_cs0s0p0h0t0w0.lm 7 CS0,S0,P0,H0,T0,W0 W0 wbdiscount gtmin 10 CS0,S0,P0,H0,T0 T0 wbdiscount CS0,S0,P0,H0 H0 wbdiscount CS0,S0,P0 P0 wbdiscount CS0,S0 S0 wbdiscount CS0 CS0 wbdiscount 0 0 wbdiscount ## headword sibling (WS) given lexcat sibling (CS), sibling (S), parent cat (P), head cat (H), head postag parent (T), headword parent (W) and head postag sibling (TS) WS : 7 CS(0) S(0) P(0) H(0) T(0) W(0) TS(0) ws_cs0s0p0h0t0w0ts0.count ws_cs0s0p0h0t0w0ts0.lm 8 CS0,S0,P0,H0,T0,W0,TS0 TS0 wbdiscount gtmin 5 CS0,S0,P0,H0,T0,W0 W0 wbdiscount gtmin 10 CS0,S0,P0,H0,T0 T0 wbdiscount gtmin 5 CS0,S0,P0,H0 H0 wbdiscount CS0,S0,P0 P0 wbdiscount CS0,S0 S0 wbdiscount CS0 CS0 wbdiscount 0 0 wbdiscount ================================================ FILE: ccgbank/models/parser/gen-events.prefs ================================================ ================================================ FILE: ccgbank/models/parser/leaf.flm ================================================ ## leaf step of Hockenmaier's HWDep generative syntactic model ## with added pos tags 1 ## expansion (E) given parent cat (P), lexcat parent (CP), head postag parent (T) and headword parent (W) E : 4 P(0) CP(0) T(0) W(0) e_p0cp0t0w0.count e_p0cp0t0w0.lm 5 P0,CP0,T0,W0 W0 wbdiscount gtmin 10 P0,CP0,T0 T0 wbdiscount P0,CP0 CP0 wbdiscount P0 P0 wbdiscount 0 0 wbdiscount ================================================ FILE: ccgbank/models/parser/model.init ================================================ 1 genlogprob 1 ================================================ FILE: ccgbank/models/parser/parse.prefs 
================================================ ================================================ FILE: ccgbank/models/parser/top.flm ================================================ ## top step of Hockenmaier's HWDep generative syntactic model ## with added pos tags 4 ## head (H) given expansion (E), parent cat (P) and lexcat parent (CP) ## nb: E, P and CP should all equal when invoked H : 3 E(0) P(0) CP(0) h_e0p0cp0.count h_e0p0cp0.lm 4 E0,P0,CP0 CP0 wbdiscount E0,P0 P0 wbdiscount E0 E0 wbdiscount 0 0 wbdiscount ## lexcat top (CT) given parent cat (P) CT : 1 P(0) ct_p0.count ct_p0.lm 2 P0 P0 wbdiscount 0 0 wbdiscount ## head postag top (TT) given lexcat parent (CP) TT : 1 CP(0) tt_cp0.count tt_cp0.lm 2 CP0 CP0 wbdiscount 0 0 wbdiscount ## headword top (WT) given lexcat parent (CP), head postag top (TT) WT : 2 CP(0) TT(0) wt_cp0tt0.count wt_cp0tt0.lm 3 CP0,TT0 TT0 wbdiscount gtmin 5 CP0 CP0 wbdiscount 0 0 wbdiscount ================================================ FILE: ccgbank/models/parser/unary.flm ================================================ ## unary step of Hockenmaier's HWDep generative syntactic model ## with added pos tags 2 ## expansion (E) given parent cat (P), lexcat parent (CP), head postag parent (T) and headword parent (W) E : 4 P(0) CP(0) T(0) W(0) e_p0cp0t0w0.count e_p0cp0t0w0.lm 5 P0,CP0,T0,W0 W0 wbdiscount gtmin 10 P0,CP0,T0 T0 wbdiscount P0,CP0 CP0 wbdiscount P0 P0 wbdiscount 0 0 wbdiscount ## head (H) given expansion (E), parent cat (P) and lexcat parent (CP) H : 3 E(0) P(0) CP(0) h_e0p0cp0.count h_e0p0cp0.lm 4 E0,P0,CP0 CP0 wbdiscount E0,P0 P0 wbdiscount E0 E0 wbdiscount 0 0 wbdiscount ================================================ FILE: ccgbank/models/parser/vocab.flm ================================================ ## flm file for determining the vocab 13 ## headword (W) unigram W : 0 w.count w.lm 1 0 0 ## headword top (WT) WT : 0 wt.count wt.lm 1 0 0 ## headword sibling (WS) WS : 0 ws.count ws.lm 1 0 0 ## expansion (E) E : 0 e.count e.lm 1 0 0 ## head (H) cat H : 0 h.count h.lm 1 0 0 ## parent (P) cat P : 0 p.count p.lm 1 0 0 ## lexcat parent (CP) CP : 0 cp.count cp.lm 1 0 0 ## lexcat top (CT) CT : 0 ct.count ct.lm 1 0 0 ## head postag top (TT) TT : 0 tt.count tt.lm 1 0 0 ## head postag parent (T) T : 0 t.count t.lm 1 0 0 ## sibling (S) cat S : 0 s.count s.lm 1 0 0 ## lexcat sibling (CS) CS : 0 cs.count cs.lm 1 0 0 ## head postag sibling (TS) TS : 0 ts.count ts.lm 1 0 0 ================================================ FILE: ccgbank/models/realizer/alph.init ================================================ 6 genlogprob 1 $ngram0 1 $ngram1 1 $ngram2 1 $ngram3 1 $deplen 1 ================================================ FILE: ccgbank/models/realizer/gen-events.prefs ================================================ ================================================ FILE: ccgbank/models/realizer/model.init ================================================ 2 genlogprob 1 $ngram0 1 ================================================ FILE: ccgbank/models/realizer/rz-test.prefs ================================================ ================================================ FILE: ccgbank/models/realizer/stp3.flm ================================================ ## Supertags FLM ## Supertag (T) based on POS tags (P), plus POS trigram 2 ## POS trigram P : 2 P(-1) P(-2) p_p1p2.count p_p1p2.lm 3 P1,P2 P2 kndiscount P1 P1 kndiscount 0 0 ndiscount ## 3gram with prev two POSs T : 3 P(0) P(-1) P(-2) t_p0p1p2.count t_p0p1p2.lm 4 P0,P1,P2 P2 kndiscount P0,P1 P1 kndiscount P0 P0 
kndiscount 0 0 kndiscount ================================================ FILE: ccgbank/models/supertagger/pos.config ================================================ # an example POS tagger config file (D.N. Mehay) # change to suit your needs (e.g., replace the following paths # with paths that point to the relevant files). # "basic" = Ratnaparkhi-style features, inter alia # there is nothing else in OpenCCG, at the moment. taggerType=basic # this model gives priors on POS tags. priorModel=posprior.flm priorModelVocab=vocab.pos # this is a Zhang Le-style MEM. maxentModel=pos.mod # this last must be an ARPA-formatted n-gram model over POS tags (with and ) # (7- to 9-grams work well, without much memory usage). sequenceModel=pos.lm # tagging beam width (beta=1 means "single-best", i.e., unitagging) beta=0.044 #beta=0.1 #beta=1.0 # tagging algorithm. (choose from 'forward' and 'forward-backward') # the former is faster, the latter is better. taggingAlgorithm=forward-backward # self-explanatory (will potentially print certain errors and warnings, if set to 'true') verbose=true ================================================ FILE: ccgbank/models/supertagger/posprior.flm ================================================ ## A prior probability model that estimates p(pos | word) ## with smoothed back-off (a "soft tagging dictionary" if you will). 1 ## POS tag (P) given word (W) with a back-off to the prior on the POS itself. P : 1 W(0) p_w0.count p_w0.lm 2 W0 W0 wbdiscount gtmin 1 0 0 wbdiscount gtmin 1 ================================================ FILE: ccgbank/models/supertagger/st.config ================================================ # an example supertagger config file (D.N. Mehay) # change to suit your needs (e.g., replace the following paths # with paths that point to the relevant files). # this is a comment ("basic" means C,C & Vadas (2006)-style features). # there is nothing else in OpenCCG, at the moment. taggerType=basic # this model gives priors on supertags. #priorModel=stprior.flm #priorModelVocab=vocab.st # this is a Zhang Le-style MEM. maxentModel=st.mod # this last must be an ARPA-formatted n-gram model over supertags (with and ) # (7- to 9-grams work well, without much memory usage). sequenceModel=st.lm # tagging beam widths (first try beta1, then beta2 if that doesn't give a parse, etc.). # give as many as you want, but keep in mind that your parser will try them all out # (which may make it try to parse in vain -- i.e., when it just doesn't have the # categories to do it). #betas = 0.024 0.003875 0.001225 0.0005377 0.000275 0.0000925 0.00004 #betas = 0.075 0.03 0.01 0.005 0.001 0.0005 betas = 0.075 0.03 0.01 0.003 0.001 0.0003 0.0001 0.00001 # if not using the prior model (above), you must give 'K' values (see Clark and Curran (2007)). # the first one is for all beta values but the last. the second one is for # the last. firstK=20 lastK=100 # also, if you're not using the prior models, you need to specify a word-keyed tagging # dictionary (this interacts with the 'K' values) and a POS-keyed tagging dictionary. wDict=word.dict.min10 posDict=pos.dict.min10 # use automatic POS features? (even if you are automatically POS tagging, # but only using single-best, set this to false). autoPOS=true # if autoPOS=true, you need to specify a POS config file. posConfig=pos.config # tagging algorithm. (choose from 'forward' and 'forward-backward') # the former is faster, the latter is better. 
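Read together, the comments in the parser's binary.flm above list the conditional distributions that make up one binary expansion step of Hockenmaier's HWDep model. Taking them as a single generative step, the step probability factors as below, with variable names exactly as in the FLM comments; this is only a restatement of those comments in equation form, not something taken from the OpenCCG sources.

\[
\begin{aligned}
P(\mathrm{binary\ step}) = {} & P(E \mid P, CP, T, W) \cdot P(H \mid E, P, CP) \cdot P(S \mid E, P, H, CP, T, W) \\
 & {} \cdot P(CS \mid E, S, P, H) \cdot P(TS \mid CS, S, P, H, T, W) \cdot P(WS \mid CS, S, P, H, T, W, TS)
\end{aligned}
\]

Each factor backs off through the context variables listed after it in the FLM file, with Witten-Bell discounting (the wbdiscount entries) at every level.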
taggingAlgorithm=forward-backward # self-explanatory (will print certain errors and warnings, if set to 'true') verbose=true # option to include gold tags #includeGold=true # POS-specific relaxation #betaMultipliers=, 0.01 : 0.01 . 0.1 CC 0.1 betaMultipliers=, 0.01 : 0.01 . 0.1 ================================================ FILE: ccgbank/models/supertagger/st.config.train ================================================ # an example supertagger config file (D.N. Mehay) # change to suit your needs (e.g., replace the following paths # with paths that point to the relevant files). # this is a comment ("basic" means C,C & Vadas (2006)-style features). # there is nothing else in OpenCCG, at the moment. taggerType=basic # this model gives priors on supertags. #priorModel=stprior.flm #priorModelVocab=vocab.st # this is a Zhang Le-style MEM. maxentModel=st.mod # this last must be an ARPA-formatted n-gram model over supertags (with and ) # (7- to 9-grams work well, without much memory usage). sequenceModel=st.lm # tagging beam widths (first try beta1, then beta2 if that doesn't give a parse, etc.). # give as many as you want, but keep in mind that your parser will try them all out # (which may make it try to parse in vain -- i.e., when it just doesn't have the # categories to do it). #betas = 0.024 0.003875 0.001225 0.0005377 0.000275 0.0000925 0.00004 #betas = 0.075 0.03 0.01 0.005 0.001 0.0005 betas = 0.075 0.03 0.01 # if not using the prior model (above), you must give 'K' values (see Clark and Curran (2007)). # the first one is for all beta values but the last. the second one is for # the last. firstK=20 lastK=100 # also, if you're not using the prior models, you need to specify a word-keyed tagging # dictionary (this interacts with the 'K' values) and a POS-keyed tagging dictionary. wDict=word.dict.min10 posDict=pos.dict.min10 # use automatic POS features? (even if you are automatically POS tagging, # but only using single-best, set this to false). autoPOS=false # if autoPOS=true, you need to specify a POS config file. posConfig=pos.config # tagging algorithm. (choose from 'forward' and 'forward-backward') # the former is faster, the latter is better. taggingAlgorithm=forward-backward # self-explanatory (will print certain errors and warnings, if set to 'true') verbose=true # option to include gold tags includeGold=true # POS-specific relaxation betaMultipliers=, 0.01 : 0.01 . 0.1 CC 0.1 ================================================ FILE: ccgbank/models/supertagger/st.noprior.config ================================================ # an example supertagger config file (D.N. Mehay) # change to suit your needs (e.g., replace the following paths # with paths that point to the relevant files). # this is a comment ("basic" means C,C & Vadas (2006)-style features). # there is nothing else in OpenCCG, at the moment. taggerType=basic # this model gives priors on supertags. use it. # nb: testing out no prior model here ... #priorModel=stprior.flm #priorModelVocab=vocab.st # this is a Zhang Le-style MEM. #maxentModel=st.mod maxentModel=st.noprior.mod # this last must be an ARPA-formatted n-gram model over supertags (with and ) # (7- to 9-grams work well, without much memory usage). sequenceModel=st.lm # tagging beam widths (first try beta1, then beta2 if that doesn't give a parse, etc.). # give as many as you want, but keep in mind that your parser will try them all out # (which may make it try to parse in vain -- i.e., when it just doesn't have the # categories to do it). 
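The dictk, firstK/lastK, wDict and posDict settings above follow the tagging-dictionary scheme of Clark (2002) and Clark and Curran (2007): frequent words are restricted to the categories the word-keyed dictionary lists for them, while rare words fall back to the POS-keyed dictionary. The sketch below shows that lookup under those assumptions; the data structures and function name are illustrative, not OpenCCG's internals.

def candidate_tags(word, pos, freq, word_dict, pos_dict, k):
    # Words seen at least k times in training keep only the categories the
    # word-keyed dictionary lists for them; rare or unseen words fall back
    # to the categories listed for their POS tag.
    if freq.get(word, 0) >= k and word in word_dict:
        return word_dict[word]
    return pos_dict.get(pos, set())

The firstK/lastK pair simply selects which cutoff is in force: firstK at every beta level except the last, lastK at the last (loosest) level, as the comments above state.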
#betas = 0.024 0.003875 0.001225 0.0005377 0.000275 0.0000925 0.00004 #betas = 0.075 0.03 0.01 0.005 0.001 0.0005 betas = 0.075 0.03 0.01 0.003 0.001 0.0003 0.0001 0.00001 # if not using the prior model (above), you must give 'K' values (see Clark and Curran (2007)). # the first one is for all beta values but the last. the second one is for # the last. firstK=20 lastK=100 # also, if you're not using the prior models, you need to specify a word-keyed tagging # dictionary (this interacts with the 'K' values) and a POS-keyed tagging dictionary. wDict=word.dict.min10 posDict=pos.dict.min10 # use automatic POS features? (even if you are automatically POS tagging, # but only using single-best, set this to false). autoPOS=true # if autoPOS=true, you need to specify a POS config file. posConfig=pos.config # tagging algorithm. (choose from 'forward' and 'forward-backward') # the former is faster, the latter is better. taggingAlgorithm=forward-backward # self-explanatory (will print certain errors and warnings, if set to 'true') verbose=true # option to include gold tags #includeGold=true # POS-specific relaxation #betaMultipliers=, 0.01 : 0.01 . 0.1 CC 0.1 betaMultipliers=, 0.01 : 0.01 . 0.1 ================================================ FILE: ccgbank/models/supertagger/stprior.flm ================================================ ## A prior probability model that estimates p(supertag | word, pos) ## with smoothed back-off (a "soft tagging dictionary" if you will). 1 ## lexical category ("supertag") (T) given POS tag (P) and word (W). T : 2 P(0) W(0) t_p0w0.count t_p0w0.lm 3 P0,W0 W0 wbdiscount gtmin 15 P0 P0 wbdiscount 0 0 wbdiscount ================================================ FILE: ccgbank/models/supertagger/vocab.flm ================================================ ## flm file for determining the vocab 3 ## word (W) unigram W : 0 w.count w.lm 1 0 0 ## supertag (T) unigram T : 0 t.count t.lm 1 0 0 ## pos tag (P) unigram P : 0 p.count p.lm 1 0 0 ================================================ FILE: ccgbank/original/models/postagger/pos.config ================================================ # an example POS tagger config file (D.N. Mehay) # change to suit your needs (e.g., replace the following paths # with paths that point to the relevant files). # "basic" = Ratnaparkhi-style features, inter alia # there is nothing else in OpenCCG, at the moment. taggerType=basic # this model gives priors on POS tags. priorModel=posprior.flm priorModelVocab=vocab.pos # this is a Zhang Le-style MEM. maxentModel=pos.mod # this last must be an ARPA-formatted n-gram model over POS tags (with and ) # (7- to 9-grams work well, without much memory usage). sequenceModel=pos.lm # tagging beam width (beta=1 means "single-best", i.e., unitagging) beta=0.044 #beta=0.1 #beta=1.0 # tagging algorithm. (choose from 'forward' and 'forward-backward') # the former is faster, the latter is better. taggingAlgorithm=forward-backward # self-explanatory (will potentially print certain errors and warnings, if set to 'true') verbose=true ================================================ FILE: ccgbank/original/models/postagger/posprior.flm ================================================ ## A prior probability model that estimates p(pos | word) ## with smoothed back-off (a "soft tagging dictionary" if you will). 1 ## POS tag (P) given word (W) with a back-off to the prior on the POS itself. 
P : 1 W(0) p_w0.count p_w0.lm 2 W0 W0 wbdiscount gtmin 1 0 0 wbdiscount gtmin 1 ================================================ FILE: ccgbank/original/models/supertagger/st.config ================================================ # an example supertagger config file (D.N. Mehay) # change to suit your needs (e.g., replace the following paths # with paths that point to the relevant files). # this is a comment ("basic" means C,C & Vadas (2006)-style features). # there is nothing else in OpenCCG, at the moment. taggerType=basic # this model gives priors on supertags. #priorModel=stprior.flm #priorModelVocab=vocab.st # this is a Zhang Le-style MEM. maxentModel=st.mod # this last must be an ARPA-formatted n-gram model over supertags (with and ) # (7- to 9-grams work well, without much memory usage). sequenceModel=st.lm # tagging beam widths (first try beta1, then beta2 if that doesn't give a parse, etc.). # give as many as you want, but keep in mind that your parser will try them all out # (which may make it try to parse in vain -- i.e., when it just doesn't have the # categories to do it). betas = 0.024 0.003875 0.001225 0.0005377 0.000275 0.0000925 0.00004 #betas = 0.075 0.03 0.01 0.005 0.001 # if not using the prior model (above), you must give 'K' values (see Clark and Curran (2007)). # the first one is for all beta values but the last. the second one is for # the last. firstK=20 lastK=100 # also, if you're not using the prior models, you need to specify a word-keyed tagging # dictionary (this interacts with the 'K' values) and a POS-keyed tagging dictionary. wDict=word.dict.min10 posDict=pos.dict.min10 # use automatic POS features? (even if you are automatically POS tagging, # but only using single-best, set this to false). autoPOS=true # if autoPOS=true, you need to specify a POS config file. posConfig=../postagger/pos.config # tagging algorithm. (choose from 'forward' and 'forward-backward') # the former is faster, the latter is better. taggingAlgorithm=forward-backward # self-explanatory (will print certain errors and warnings, if set to 'true') verbose=true ================================================ FILE: ccgbank/original/models/supertagger/stprior.flm ================================================ ## A prior probability model that estimates p(supertag | word, pos) ## with smoothed back-off (a "soft tagging dictionary" if you will). 1 ## lexical category ("supertag") (T) given POS tag (P) and word (W). 
T : 2 P(0) W(0) t_p0w0.count t_p0w0.lm 3 P0,W0 W0 wbdiscount gtmin 15 P0 P0 wbdiscount 0 0 wbdiscount ================================================ FILE: ccgbank/original/models/supertagger/vocab.flm ================================================ ## flm file for determining the vocab 3 ## word (W) unigram W : 0 w.count w.lm 1 0 0 ## supertag (T) unigram T : 0 t.count t.lm 1 0 0 ## pos tag (P) unigram P : 0 p.count p.lm 1 0 0 ================================================ FILE: ccgbank/plugins/MyGenSynScorer.java ================================================ package plugins; import opennlp.ccg.synsem.*; import java.io.*; public class MyGenSynScorer extends GenerativeSyntacticModel { static String modeldir = getModelDir(); static String getModelDir() { String retval = System.getProperty("gensyn.model.dir", "models/parser"); if (!retval.endsWith("/")) retval += "/"; return retval; } public MyGenSynScorer() throws IOException { super(modeldir+"top.flm", modeldir+"leaf.flm", modeldir+"unary.flm", modeldir+"binary.flm"); } } ================================================ FILE: ccgbank/plugins/MyNgramCombo.java ================================================ package plugins; import opennlp.ccg.ngrams.*; import java.io.*; import java.util.*; import java.lang.Thread; public class MyNgramCombo extends LinearNgramScorerCombo { static String bigWordsLM() { String retval = System.getProperty("big.words.lm", "models/realizer/gigaword4.5g.kenlm.bin"); if (new File(retval).exists()) return retval; System.out.println("Reusing trigram model as a stand-in for the big LM"); return null; } static String wordsLM() { return System.getProperty("words.lm", "models/realizer/train.3bo"); } static String wordsSCLM() { return System.getProperty("words.sc.lm", "models/realizer/train-sc.3bo"); } static String stposFLM() { return System.getProperty("stpos.flm", "models/realizer/stp3.flm"); } // map to keep track of trigram model for reuse static Map lmMap = new IdentityHashMap(5); // return big lm, while setting trigram model if using it as a stand-in static NgramScorer getBigLM() throws IOException { String biglm = bigWordsLM(); if (biglm != null) return new KenNgramModel(5, biglm, false, true, true, '_', false); NgramScorer retval = new StandardNgramModel(3, wordsLM()); lmMap.put(Thread.currentThread(), retval); return retval; } // return trigram lm, reusing existing one if present static NgramScorer getWordsLM() throws IOException { NgramScorer retval = lmMap.get(Thread.currentThread()); if (retval != null) { lmMap.remove(Thread.currentThread()); return retval; } return new StandardNgramModel(3, wordsLM()); } public MyNgramCombo() throws IOException { super(new NgramScorer[] { getBigLM(), getWordsLM(), new StandardNgramModel(3, wordsSCLM(), true), new FactoredNgramModelFamily(stposFLM()) }); } } ================================================ FILE: ccgbank/plugins/MyNgramGenSynProduct.java ================================================ package plugins; import opennlp.ccg.ngrams.*; import opennlp.ccg.synsem.*; import java.io.*; public class MyNgramGenSynProduct extends SignScorerProduct { public MyNgramGenSynProduct() throws IOException { super(new SignScorer[] { new MyGenSynScorer(), new MyNgramCombo() }); } } ================================================ FILE: ccgbank/plugins/MyNgramPrecisionBaselineGenInterp.java ================================================ package plugins; import opennlp.ccg.ngrams.*; import opennlp.ccg.synsem.*; import java.io.*; public class 
MyNgramPrecisionBaselineGenInterp extends SignScorerInterpolation implements SelfParaphraseBiaser { static String[] targets = { "e plurubus unum" }; NgramPrecisionModel selfBiaser; public MyNgramPrecisionBaselineGenInterp() throws IOException { super( new SignScorer[] { new NgramPrecisionModel(targets), new MyNgramGenSynProduct() }, new double[] { 100.0, 1.0 } ); selfBiaser = (NgramPrecisionModel) models[0]; } public void setTargets(String[] targets) { selfBiaser.setTargets(targets); } } ================================================ FILE: ccgbank/plugins/MyNgramPrecisionPerceptronInterp.java ================================================ package plugins; import opennlp.ccg.ngrams.*; import opennlp.ccg.synsem.*; import java.io.*; public class MyNgramPrecisionPerceptronInterp extends SignScorerInterpolation implements SelfParaphraseBiaser { static String[] targets = { "lee said brianna had dragged food , toys and other things into the bedroom .", "lee , 33 , said the girl had dragged the food , toys and other things into her mother 's bedroom ." //"charles o. prince , 53 , was named as mr. weill 's successor .", //"mr. weill 's longtime confidant , charles o. prince , 53 , was named as his successor ." }; NgramPrecisionModel selfBiaser; public MyNgramPrecisionPerceptronInterp() throws IOException { super( new SignScorer[] { new NgramPrecisionModel(targets), new MyRealizerPerceptronScorer() }, //new double[] { 100.0, 1.0 } new double[] { 10000.0, 1.0 } ); selfBiaser = (NgramPrecisionModel) models[0]; } public void setTargets(String[] targets) { selfBiaser.setTargets(targets); } } ================================================ FILE: ccgbank/plugins/MyParserPerceptronScorer.java ================================================ package plugins; import opennlp.ccg.synsem.*; import opennlp.ccg.perceptron.*; import opennlp.ccg.hylo.*; import java.io.*; public class MyParserPerceptronScorer extends ReRankingPerceptronScorer { static String modeldir = getModelDir(); static String getModelDir() { String retval = System.getProperty("parser.models.dir", "models/parser"); if (!retval.endsWith("/")) retval += "/"; return retval; } static String modelname = getModelName(); static String getModelName() { return System.getProperty("parser.model.name", "model.gz"); } public MyParserPerceptronScorer() throws IOException { super( //new ComposedFeatureExtractor(new MyGenSynScorer(), new SyntacticFeatureExtractor()), new ComposedFeatureExtractor(new MyGenSynScorer(), new MySynSemFeatureExtractor()), new Model(modeldir + modelname) ); } protected SignScorer getBaseScorer(FeatureExtractor featureExtractor) { return (SignScorer) ((ComposedFeatureExtractor)featureExtractor).featureExtractors[0]; } } ================================================ FILE: ccgbank/plugins/MyRealizerPerceptronScorer.java ================================================ package plugins; import opennlp.ccg.synsem.*; import opennlp.ccg.perceptron.*; import java.io.*; public class MyRealizerPerceptronScorer extends PerceptronScorer { static String getModelDir() { String retval = System.getProperty("realizer.models.dir", "models/realizer"); if (!retval.endsWith("/")) retval += "/"; return retval; } static String getModelName() { return System.getProperty("realizer.model.name", "model.gz"); } static String getAgrMultiplier() { return System.getProperty("realizer.agr.mult", "10"); } static double calcAgrMultiplier() { try { double mult = Double.parseDouble(getAgrMultiplier()); return mult; } catch (NumberFormatException exc) { 
System.out.println("Ignoring unparseable negative agreement feature weight multiplier: " + getAgrMultiplier()); return 1.0; } } static double agrMult = calcAgrMultiplier(); public MyRealizerPerceptronScorer() throws IOException { super( //new ComposedFeatureExtractor(new MyNgramGenSynProduct(), new MySynAgrFeatureExtractor()), new ComposedFeatureExtractor(new MyNgramGenSynProduct(), new MySynSemAgrFeatureExtractor()), new Model(getModelDir() + getModelName(), agreementFilter) ); System.out.println("Loading perceptron model from: " + getModelDir() + getModelName()); System.out.println("Boosting negative agreement and punctuation balancing feature weights by a factor of " + agrMult); } // feature filter for boosting negative agreement feature weights private static Model.FeatureFilter agreementFilter = new Model.FeatureFilter() { /** Returns the modified feature weight for the given feature. */ public double adjustedWeight(String name, double weight) { if (weight >= 0) return weight; if (name.equals("$punct") || name.startsWith("AGR") || isAdjacentPunctFeat(name)) return weight * agrMult; return weight; } }; // returns whether a feature is an adjacent punctuation n-gram feature private static boolean isAdjacentPunctFeat(String name) { String[] keys = name.split(":"); if (keys.length >= 2 && isPunct(keys[0]) && isPunct(keys[1])) return true; if (keys.length >= 4 && keys[0].equals("P") && keys[2].equals("P") && isPunct(keys[1]) && isPunct(keys[3])) return true; return false; } // sentence-boundary markers treated like punctuation private static boolean isPunct(String token) { return token.equals("-") || token.equals("--") || token.equals(",") || token.equals(";") || token.equals(":") || token.equals("!") || token.equals("?") || token.equals(".") || token.equals("...") || token.equals("``") || token.equals("'") || token.equals("''") || token.equals("LRB") || token.equals("RRB"); } } ================================================ FILE: ccgbank/plugins/MySynAgrFeatureExtractor.java ================================================ package plugins; import opennlp.ccg.synsem.*; import opennlp.ccg.perceptron.*; import opennlp.ccg.hylo.*; public class MySynAgrFeatureExtractor extends ComposedFeatureExtractor { public MySynAgrFeatureExtractor() { super(new SyntacticFeatureExtractor(), new EnglishAgreementExtractor()); } } ================================================ FILE: ccgbank/plugins/MySynSemAgrFeatureExtractor.java ================================================ package plugins; import opennlp.ccg.synsem.*; import opennlp.ccg.perceptron.*; import opennlp.ccg.hylo.*; public class MySynSemAgrFeatureExtractor extends ComposedFeatureExtractor { public MySynSemAgrFeatureExtractor() { super(new MySynSemFeatureExtractor(), new EnglishAgreementExtractor()); } } ================================================ FILE: ccgbank/plugins/MySynSemFeatureExtractor.java ================================================ package plugins; import opennlp.ccg.synsem.*; import opennlp.ccg.perceptron.*; import opennlp.ccg.hylo.*; public class MySynSemFeatureExtractor extends ComposedFeatureExtractor { public MySynSemFeatureExtractor() { super(new SyntacticFeatureExtractor(), new LexDepFeatureExtractor()); } } ================================================ FILE: ccgbank/stanford-nlp/classifiers/stanfordner-README ================================================ Place your Stanford NE tagging models here. 
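A note on the plugin classes above: they are thin wrappers that compose OpenCCG scorers and feature extractors, and new combinations can be defined in the same way. The class below is a hypothetical sketch (not part of the release) that interpolates the generative syntactic model with the n-gram combo using the same SignScorerInterpolation pattern as the My*Interp classes above; the class name and the interpolation weights are purely illustrative.

package plugins;

import opennlp.ccg.synsem.*;
import opennlp.ccg.ngrams.*;
import java.io.*;

// Hypothetical plugin: a weighted interpolation of the generative syntactic
// model and the n-gram combo, following the same pattern as the classes above.
public class MyWeightedGenSynNgramInterp extends SignScorerInterpolation {
    public MyWeightedGenSynNgramInterp() throws IOException {
        super(
            new SignScorer[] { new MyGenSynScorer(), new MyNgramCombo() },
            new double[] { 1.0, 2.0 }   // illustrative interpolation weights
        );
    }
}

Like the shipped plugins, such a class would live in the plugins package so the existing build files can compile it alongside the others; how it gets selected at run time depends on the particular build configuration being used.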
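The supertagger configuration files further above describe Clark & Curran-style multitagging: each word keeps every supertag whose probability is within a factor beta of its best tag, the parser retries with progressively smaller beta values when no parse is found, and the firstK/lastK and tagging-dictionary settings restrict the candidate tags when the prior model is not used (see Clark and Curran (2007)). The following is a minimal sketch of the beta cutoff only, not OpenCCG's implementation; all names in it are made up for the example.

import java.util.*;
import java.util.stream.Collectors;

// Minimal illustration of the beta cutoff used by the supertagger configs
// above (not OpenCCG's code).  A word keeps every supertag whose probability
// is within a factor beta of the most probable one; beta=1.0 reduces to
// single-best tagging.  The real tagger additionally restricts candidates via
// the word- and POS-keyed tagging dictionaries when no prior model is used.
public class BetaCutoffSketch {

    static List<String> keepTags(Map<String, Double> tagProbs, double beta) {
        double max = Collections.max(tagProbs.values());
        return tagProbs.entrySet().stream()
            .filter(e -> e.getValue() >= beta * max)
            .sorted(Map.Entry.<String, Double>comparingByValue().reversed())
            .map(Map.Entry::getKey)
            .collect(Collectors.toList());
    }

    public static void main(String[] args) {
        Map<String, Double> probs = new HashMap<>();
        probs.put("np", 0.55); probs.put("n", 0.30);
        probs.put("s/np", 0.10); probs.put("np/n", 0.03);
        // With the first beta in st.config (0.075) three tags survive;
        // the parser falls back to smaller betas if no parse is found.
        System.out.println(keepTags(probs, 0.075));  // [np, n, s/np]
        System.out.println(keepTags(probs, 1.0));    // [np]
    }
}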
================================================ FILE: ccgbank/stanford-nlp/stanfordnlp-README ================================================ Place your Stanford core NLP jar file here (preferably renaming it to 'stanford-core-nlp.jar') and then also place, e.g., NE tagging models under './classifiers'. ================================================ FILE: ccgbank/templates/addFilterLexFeats.xsl ================================================ ================================================ FILE: ccgbank/templates/addStems.xsl ================================================ PERF PROG PASS ================================================ FILE: ccgbank/templates/adjustAppos.xsl ================================================ ================================================ FILE: ccgbank/templates/adjustCandCcats1.xsl ================================================ ================================================ FILE: ccgbank/templates/adjustCats.xsl ================================================ ================================================ FILE: ccgbank/templates/adjustParenthetical.xsl ================================================ ================================================ FILE: ccgbank/templates/adjustReportedSpeech.xsl ================================================ ================================================ FILE: ccgbank/templates/adjustRoles.xsl ================================================ ================================================ FILE: ccgbank/templates/adv-placement.xsl ================================================ ================================================ FILE: ccgbank/templates/agr-macroInsert.xsl ================================================ ================================================ FILE: ccgbank/templates/allotIdLeaf.xsl ================================================ '' ================================================ FILE: ccgbank/templates/allotIdTree.xsl ================================================ ================================================ FILE: ccgbank/templates/allotIndexRel.xsl ================================================ First GenRel GenRel GenRel moodColon ApposRel ApposRel ApposRel ApposRel ApposRel whApposRel emph-intro EmphIntro ElabRel modFeat emph-final EmphFinal interrupt InterruptRel ParenRel colonExp DashInterp EllipsisRel ================================================ FILE: ccgbank/templates/anim-macroInsert.xsl ================================================ ================================================ FILE: ccgbank/templates/annotateAppos-Dash.xsl ================================================ ================================================ FILE: ccgbank/templates/annotateAppos1.xsl ================================================ ================================================ FILE: ccgbank/templates/annotateAppos2.xsl ================================================ ================================================ FILE: ccgbank/templates/annotateAppos3.xsl ================================================ ================================================ FILE: ccgbank/templates/annotateBrackets.xsl ================================================ res arg ================================================ FILE: ccgbank/templates/annotateColons.xsl ================================================ ================================================ FILE: ccgbank/templates/annotateDots.xsl ================================================ 
================================================ FILE: ccgbank/templates/annotateExtraposedAppos.xsl ================================================ ================================================ FILE: ccgbank/templates/annotateNom-AdjConj.xsl ================================================ ================================================ FILE: ccgbank/templates/annotateParentheticals1.xsl ================================================ ADV-PAREN PP-PAREN ================================================ FILE: ccgbank/templates/annotateParentheticals2.xsl ================================================ ================================================ FILE: ccgbank/templates/annotatePlace.xsl ================================================ ================================================ FILE: ccgbank/templates/annotatePrtConjs.xsl ================================================ ================================================ FILE: ccgbank/templates/annotateQuotes.xsl ================================================ '' `` ================================================ FILE: ccgbank/templates/annotateReportedSpeech.xsl ================================================ ================================================ FILE: ccgbank/templates/annotateStrayAppos.xsl ================================================ ================================================ FILE: ccgbank/templates/annotateVPCommas.xsl ================================================ \ / ================================================ FILE: ccgbank/templates/balanceAppos.xsl ================================================ ================================================ FILE: ccgbank/templates/balanceDash-Paren.xsl ================================================ ================================================ FILE: ccgbank/templates/catCheck.xsl ================================================ ================================================ FILE: ccgbank/templates/ccgRules.xsl ================================================ Purpose GenRel ================================================ FILE: ccgbank/templates/changePunct.xsl ================================================ ================================================ FILE: ccgbank/templates/closedCatInsert.xsl ================================================ *NoSem* *NoSem* *NoSem* *NoSem* *NoSem* GenOwn GenRel int excl imp dcl ================================================ FILE: ccgbank/templates/collapseMWUFull.xsl ================================================ ================================================ FILE: ccgbank/templates/collapseMWUPart.xsl ================================================ ================================================ FILE: ccgbank/templates/collapseMWUSharedTask.xsl ================================================ ================================================ FILE: ccgbank/templates/computeCats.xsl ================================================ ( ) $ _ [ ] _ ~ ( ) $ [ ] ================================================ FILE: ccgbank/templates/convTags.xsl ================================================ ================================================ FILE: ccgbank/templates/correctMistakes1.xsl ================================================ ================================================ FILE: ccgbank/templates/correctPPHeads.xsl ================================================ ================================================ FILE: ccgbank/templates/exportToAuto.xsl 
================================================ PARSER=GOLD NUMPARSE=1 Missing head index or length in (<T > ) (<L >) ( ) ( ) $ _ [ ] _ ~ ================================================ FILE: ccgbank/templates/filterLex.xsl ================================================ ================================================ FILE: ccgbank/templates/find-s-back-n.xsl ================================================ ================================================ FILE: ccgbank/templates/genchal11-out.xsl ================================================ ================================================ FILE: ccgbank/templates/inferConjRules.xsl ================================================ ================================================ FILE: ccgbank/templates/insertLF.xsl ================================================ ================================================ FILE: ccgbank/templates/insertOrigPunctsLF.xsl ================================================ *NoSem* ================================================ FILE: ccgbank/templates/insertPTBInfo.xsl ================================================ ================================================ FILE: ccgbank/templates/insertPunctLF-PosMod.xsl ================================================ First GenRel GenRel GenRel moodColon ApposRel ApposRel ApposRel ApposRel ApposRel whApposRel emph-intro EmphIntro ElabRel modFeat emph-final EmphFinal interrupt InterruptRel ParenRel colonExp DashInterp EllipsisRel quote-rel * ================================================ FILE: ccgbank/templates/insertPunctLF.xsl ================================================ First GenRel GenRel GenRel moodColon ApposRel ApposRel ApposRel ApposRel ApposRel whApposRel emph-intro EmphIntro ElabRel modFeat emph-final EmphFinal interrupt InterruptRel ParenRel colonExp DashInterp EllipsisRel * ================================================ FILE: ccgbank/templates/insertQuoteSemClassInfo.xsl ================================================ NAME ================================================ FILE: ccgbank/templates/insertSemFeats.xsl ================================================ ================================================ FILE: ccgbank/templates/introduceMMExtns.xsl ================================================ ================================================ FILE: ccgbank/templates/labelAppos.xsl ================================================ ================================================ FILE: ccgbank/templates/labelConj1.xsl ================================================ ================================================ FILE: ccgbank/templates/labelConj2.xsl ================================================ ================================================ FILE: ccgbank/templates/labelConj3.xsl ================================================ ================================================ FILE: ccgbank/templates/labelPlace1.xsl ================================================ ================================================ FILE: ccgbank/templates/labelPlace2.xsl ================================================ ================================================ FILE: ccgbank/templates/labelPuncts.xsl ================================================ ================================================ FILE: ccgbank/templates/lexExtr.xsl ================================================ ================================================ FILE: ccgbank/templates/macroInsert.xsl ================================================ 
================================================ FILE: ccgbank/templates/macroLexDef.xsl ================================================ ================================================ FILE: ccgbank/templates/markMistakes.xsl ================================================ ================================================ FILE: ccgbank/templates/markUnmatched.xsl ================================================ ================================================ FILE: ccgbank/templates/mergeMorph.xsl ================================================ morph.xml ================================================ FILE: ccgbank/templates/morphExtr.xsl ================================================ ================================================ FILE: ccgbank/templates/normPTBTags.xsl ================================================ X X ================================================ FILE: ccgbank/templates/normPunctPos.xsl ================================================ PUNCT_APPOS np_~1\np_1/s[dcl]_2\(np_3\np_4/np_1) pp[]_~2/np_2 ================================================ FILE: ccgbank/templates/origPunctRules.xsl ================================================ , ================================================ FILE: ccgbank/templates/overtWHLexRels.xsl ================================================ ================================================ FILE: ccgbank/templates/overtWHPronouns.xsl ================================================ ================================================ FILE: ccgbank/templates/phraseExtractor.xsl ================================================ ================================================ FILE: ccgbank/templates/preSentAdj.xsl ================================================ ================================================ FILE: ccgbank/templates/punctLexConjRules.xsl ================================================ args res res args res args args res args res args args args args ================================================ FILE: ccgbank/templates/reinsertPTBInfo.xsl ================================================ ================================================ FILE: ccgbank/templates/repairUnmatched.xsl ================================================ ================================================ FILE: ccgbank/templates/replaceColons.xsl ================================================ ================================================ FILE: ccgbank/templates/rulesExtr.xsl ================================================ ================================================ FILE: ccgbank/templates/sentFinalPuncts.xsl ================================================ ================================================ FILE: ccgbank/templates/trueCaser.xsl ================================================ ================================================ FILE: ccgbank/templates/uncurryBareParse.xsl ================================================ ================================================ FILE: devel/BEN.TODO ================================================ for tuesday 1/9/07: -- test new code in ccg.ply for --prefix and such. first make sure it still works with no --prefix option, producing files with prefixes from the filename and that foo-grammar.xml has the right names in it that it points to. (and no interference from the graphics code.) then test with --prefix and make sure it does what it should (again check grammar.xml), even if --prefix is specified to be blank. -- make sure that the existing test grammars still work. 
(might need to be done after resolving the issue of caps vs. lowercase, since the current grammars already use switch feature vars to lowercase, which will be wrongly interpreted as semantic vars.) check that the testbed still does what it should and gives results it should. -- take a look at the rough grammar; make sure it gets compiled OK by TeX and the results come out. maybe add some more text. -- think about that mod to family, so that a simple family with one entry can appear without extra syntax: family foo: entry of some sort: hybrid logic spec; which is the same as family foo { entry: entry of some sort: hybrid logic spec; } ================================================ FILE: devel/schedule.txt ================================================ CCG editor schedule Step 1 - get a simple editor working; has buttons and/or menu across the top with new/edit/save buttons; for "formatted text" just display text as-is -- add some small buttons at top of editing area for insertion of common CCG structures -- add popup help on these buttons (right click, select "help", or something) that shows in more detail the expected format -- add extra buttons (top or bottom) for particular CCG symbols (e.g. the symbols used to indicate different slash modes); pressing on them inserts the appropriate symbol char(s) and they have help text shown when moving over them More strictly: -- use the PyEdit code from Python Cookbook (not sure about legality; if not, we can just rewrite it, but i don't think it'll be a problem). -- run the editor, examine it in action, figure out how it works by examining the code; in particular, figure out how keystrokes are handled, since i don't see any keystroke code. -- create two separate modules. one just compiles the code, while the other is the GUI. -- one idea for layout: (1) for the GUI, originally follow Wikipedia's model in which the layout view is the "normal" view and editing is performed as a temporary operation with a "preview" that brings up the layout view in a pane above the edit window, so that further editing can be performed, in addition to an "accept" that goes back to the regular layout view only. (2) this one is editor centric. View pops up a "view" [FIX THIS] add a toolbar under the window with textual buttons for Load, New, View; originally display an empty edit screen. New, Load create new top-level windows; make sure that multiple windows work. Load loads an existing file into a new window. View runs the compiler (see below), and displays the error results into a new pane below the edit window. There should be next-error and previous-error commands. This pane can be hidden, but it reappears on the next next/previous-error commands. -- copy all related files from quiche/mangue, get full environment set up locally; also create subversion repository -- add a "compile" button; this runs the CCG2XML compiler and displays any error messages in a separate pane of the window; pane can be viewed or hidden using menu item or button -- then, parse error messages to get the line number; clicking on an error message shows the appropriate line in the text -- improve on display -- run compiler before displaying; using result of parsing, display separate sections corresponding to major sections of text (e.g. 
feature {} declaration, family {} declarations) -- initially, just show actual text corresponding to section -- get working the ability to hide/display a particular section and to edit just that section -- gradually, format into something more intelligent; do this section by section -- we already have some code for formatting CCG categories -- add controls for display of CCG categories -- figure out what to do about macros -- at first, just do whatever works in order to get the editor up and running -- macro definitions themselves should be shown with their raw text; it's not clear we can do much more -- macros can cause arbitrary text to be expanded at a particular position; perhaps in display we show macro-expanded sections in a separate color, and allow the sections to be collapsed back to the original text that led to the expansions, on a macro-by-macro basis (some sort of options menu showing all macros and check marks by them for expansion or not) Step 1: toolbar across top, with buttons "Display", "Edit", "Test" each of these changes the widgets below it, and potentially the menubar above it; each has a second toolbar above a large text widget showing something title bar should show name of file status bar at the bottom, ala emacs shows the current mode (display/edit/test) plus other mode-specific info (e.g. for edit, success or failure of recent compilation) Display: buttons for controlling the display (e.g. presence or absence of features) widget showing formatted display Edit: buttons for editing common CCG structures has a preview button, which compiles the text and then displays a second pane below, showing either the errors from compilation or has a save button, which saves text editor widget Test: FIXME: fill in; should allow for running the CCG interpreter and/or web front end (or something that behaves similarly) implementation: - should allow for multiple top-level windows editing different files; hence do not use global variables for status information, but store inside of a "file" object Display, Edit, Test are subclasses of Frame clicking on Display/Edit/Test toolbar buttons: -- hides the existing frame for this mode and displays the new frame -- should not cause window resize! -- should start in Edit mode -- when switching from edit to display, if text has been modified, we either need to bring up a dialog box asking whether to discard the text, or remember the modified text and display in the status bar that the text has been modified -- in Edit mode, you have Save and Display buttons; Display asks to save Save saves text another row of toolbar buttons below, for inserting common brings up a - get a simple editor working; has buttons and/or menu across the top with new/edit/save buttons; for "formatted text" just display text as-is -- add some small buttons at top of editing area for insertion of common CCG structures -- add popup help on these buttons (right click, select "help", or something) that shows in more detail the expected format -- add extra buttons (top or bottom) for particular CCG symbols (e.g. 
the symbols used to indicate different slash modes); pressing on them inserts the appropriate symbol char(s) and they have help text shown when moving over them

================================================
FILE: docs/build.xml
================================================

================================================
FILE: docs/ccgbank-README
================================================

Introduction
============

This README describes how to use the pre-built English models trained using the CCGbank, as well as how to train these models yourself starting with the CCGbank.

On the realization side, the models make use of all published work on realization ranking (as of March, 2013) -- including discriminatively trained syntactic models, various n-grams, features for syntactic agreement and balanced punctuation, and features for dependency ordering and dependency length minimization -- as well as unpublished improvements to the hypertagger that make use of a two-stage, 'stacked' approach to supertag prediction. For linux, this release also includes support for using a very large 5-gram memory-mapped language model with KenLM.

On the parsing side, a reimplementation of Hockenmaier's generative parse model is used, along with a reimplementation of Curran, Clark & Vadas's supertagger in Java. Note that the supertagger can also be used as a stand-alone tool; see taggers-README for details.

The grammars take advantage of refinements to the CCGbank that make use of Propbank analyses as well as more precise analyses of punctuation. (See references at bottom.)

Since the pre-built English models and CCGbank data for training represent much larger downloads than the OpenCCG core files, they are available as separate downloads (where YYYY-MM-DD represents the date of creation):

  english-models.YYYY-MM-DD.tgz
  ccgbank-data.YYYY-MM-DD.tgz

For linux, the very large KenLM language model, based on 5-grams in the Gigaword-4 corpus, is available as follows:

  gigaword4.5g.kenlm.bin

Using the pre-built English models
==================================

The pre-built statistical models for English allow you to parse novel text in English and to generate English sentences from the (quasi-) logical forms of the resulting parses, thereby producing a variety of grammatical paraphrases. Future releases will contain tools for generating a broader range of paraphrases using disjunctive logical forms, which can handle logical forms with similar, but not identical, structures. It is also possible to use the pre-built models to realize sentences from logical forms constructed programmatically.

Note, however, that in comparison to realization with small, hand-crafted grammars, realization with the broad coverage grammar derived from the CCGbank is much slower (with realization typically taking a few seconds per sentence). For NLG applications, an interesting task for future work would be to automatically shrink the grammar's coverage to what is needed for a specific domain, which should yield considerable improvements in efficiency.

The pre-built statistical models do not require you to have a copy of the CCGbank, and should run across different Java platforms. They do, however, assume the use of the Stanford Core NLP tools for tokenization, named entity tagging and morphological analysis. The Stanford NLP tools are licensed under the full GPL (rather than the LGPL, as with OpenCCG), and thus these tools are only loosely integrated into a chain of command-line tool invocations.
If the GPL is not adequate for your purposes, you'll need to find your own substitute tools. The first step is to make sure you have configured your environment variables and increased your Java memory limit as described in the main README ($OPENCCG_HOME/README). A limit of 2g may be ok, though 4g may work even better; when using the very large KenLM language model, you should use a limit of at least 8g. The next step is to download the current version of english-models.YYYY-MM-DD.tgz, and move it into the ccgbank directory, i.e. $OPENCCG_HOME/ccgbank/, with the undated name english-models.tgz. From this directory, you can unpack the English models archive as shown below: $ mv english-models.YYYY-MM-DD.tgz $OPENCCG_HOME/ccgbank/english-models.tgz $ cd $OPENCCG_HOME/ccgbank $ ccg-build -f build-release.xml extract-models This command uses ant to extract the models in a cross-platform way. As noted in the main README, ccg-build is a simple front end for ant that configures the classpath (and a couple of properties) before invoking ant. The option '-f build-release.xml' simply says to use the build-release.xml build file instead of the default build file. The 'extract-models' target unpacks the archive in a way that makes sure the archive is in the right place before unpacking it. If extracting the models this way yields an error, however, you should use tar (or some other archive extraction tool), eg as follows: $ mv english-models.YYYY-MM-DD.tgz $OPENCCG_HOME/ccgbank/english-models.tgz $ cd $OPENCCG_HOME/ccgbank $ tar xzf english-models.tgz On linux, after downloading the very large language model file, you can install it for use as follows: $ mv gigaword4.5g.kenlm.bin $OPENCCG_HOME/ccgbank/models/realizer/. As noted in the main README, to use the very large LM, you'll also need to set the library load path: $ export LD_LIBRARY_PATH=$LD_LIBRARY_PATH:$OPENCCG_HOME/lib If the file gigaword4.5g.kenlm.bin is not found, the Treebank-trained trigram model is reused as a stand-in, which will negatively impact realization quality to some extent. In principle it should also be possible to build your own large binary 5-gram model. At present, however, there is no working JNI interface to KenLM for OS X or Windows included. See http://kheafield.com/code/kenlm/ for further information on building large language models and getting KenLM to compile on different platforms, if you would like to try getting the JNI interface working beyond linux. After that, the next step is installing the Stanford Core NLP tools, as described in the section with this name below. At this point you should be ready to try out the models. You can try parsing and realization on a file with a couple of novel sentences containing some named entities that did not exist when the Penn Treebank was created, as well as an adverb that is too infrequent to appear in the training set lexicon, as follows: $ ccg-build -f build-ps.xml test-novel &> logs/log.ps.test.novel & You can follow the progress of the parsing tool chain by looking in the log file. The input file is data/novel/two-sents, and the output files are stored in a newly created directory data/novel/two-sents.dir/. The tool chain does PTB tokenization, truecasing, named entity tagging, POS tagging and stemming in order to create a truecased version of each sentence as well as a morph file that includes all the words in the file. The sentences are then parsed, and the resulting logical forms appear in a testbed file data/novel/two-sents.dir/tb.xml. 
The tool chain takes a while to run (a couple of minutes, perhaps) as it must load several large data models; thus, for more efficient processing, it will make sense to run many more than two sentences in a batch.

Once the parser has run, you can test the realizer on the resulting testbed file as follows:

$ ccg-build -f build-rz.xml test-novel &> logs/log.rz.test.novel &

Again, you can follow the progress by consulting the log file. The realizations should appear in data/novel/two-sents.dir/realize.nbest.

The input file for this test is given by the novel.file property (in build-models.properties). You can override this property on the command line to re-use these build files on your own text, where <file> is the name of your file:

$ ccg-build -Dnovel.file=<file> -f build-ps.xml test-novel &> logs/log.ps.test.novel &
$ ccg-build -Dnovel.file=<file> -f build-rz.xml test-novel &> logs/log.rz.test.novel &

After running these commands, the parses and realizations will be in a new directory <file>.dir/.

Tokenization and Normalization of Novel Input Texts
===================================================

Note that when parsing text, we assume Penn Treebank III (PTB3) tokenization and character escaping conventions (see the PTB3 documentation).*** We assume the following:

-Text is one sentence (or coherent utterance) per line with no intervening blank lines. (This you must do yourself.)

-PTB3 parser-friendly tokenization, e.g.:
   do n't, wo n't, it 's, John 's, etc.
 and not:
   don 't, won 't, it ' s, John ' s, etc.
 (as some tokenization scripts are fond of doing)
 Of course, punctuation should be split off from words, so, e.g.:
   John said ``Hello'' to Mary, who replied ``Hi, John''.
 should be tokenized as:
   John said `` Hello '' to Mary , who replied `` Hi , John '' .

-PTB3 escapes for characters that are meta-symbols in the PTB3, e.g.:
   (, ), { and }
 become:
   -LRB-, -RRB-, -LCB- and -RCB-, respectively.

-"LaTeX"-style double quotation marks:
   `` Hello '' , said John to Mary .
 and not:
   " Hello " , said John to Mary .

-Attributive quotations should be formatted in the "logical" or "British" style and not the "American" style, so, e.g.:
   `` Hello '' , said John to Mary .
 and NOT:
   `` Hello , '' said John to Mary.
 (N.B. this is the only other thing related to sentence segmentation and tokenization that the Stanford PTBTokenizer.java code does not accomplish.)

-Also, Unicode punctuation symbols outside the ASCII range should be converted to their ASCII equivalents, e.g.:
   … should be re-written as ...

-When a sentence-final abbreviation ending with a period/full-stop ends a declarative sentence (i.e., there is therefore no sentence final punctuation mark), the final period/full-stop should not be split off, so that we have, e.g.:
   Many products sold at Smithy's Department Store are not produced in the U.S.
 tokenized as:
   Many products sold at Smithy 's Department Store are not produced in the U.S.
 and not:
   Many products sold at Smithy 's Department Store are not produced in the U.S .

These text transformations will bring novel texts more in line with the texts the parser and realizer were trained on and will improve parsing and realization performance.

Finally, all text passed to the parser is assumed to be encoded as UTF-8 or ASCII (the latter being a subset of UTF-8). Other encodings may cause the parser or realizer to crash in unforeseen ways.

***The Stanford Core NLP tools (which we use, see below) already do most of what this section covers, so if you plan not to use the Stanford tools you will need to find a replacement.
The Stanford PTBTokenizer.java code does all that we mentioned above, except transforming "American"-style quotations to "British/logical"-style quotations, and ensuring that texts are encoded in UTF-8. American-to-logical quotation transformation is performed by the code in:

   $OPENCCG_HOME/ccgbank/bin/american-to-logical-quotes.py

This is invoked by Ant through build-ps.xml. Unicode X-to-UTF-8 conversion can be accomplished with the script:

   $OPENCCG_HOME/ccgbank/bin/toUTF-8.py

(assuming that Python's 'chardet' package has been installed). The first takes text from stdin and pipes text to stdout; the second has various option flags (type 'python toUTF-8.py -h' for more information). Both have only been tested with Python 2.6x.

As for formatting your texts to be one sentence per line, this you must do yourself, as we cannot anticipate what forms of marked up texts will be passed in for parsing.

Building the English models from the CCGbank
============================================

You can train your own English models if you have a licensed copy of the CCGbank. To build the models, you'll need to download and patch Zhang Le's maxent toolkit and install the SRILM language modeling toolkit, assuming their licenses are compatible with your usage. In theory it may be possible to use these tools on different platforms, but in practice it will be much easier to use a linux platform, preferably one with multiple processors and lots of memory.

For installing Zhang Le's maxent toolkit, see the section with this title below. For the SRILM toolkit, follow the installation instructions on the SRILM website, and make sure the SRILM executables are available on your PATH environment variable.

After installing the required toolkits, the next step is to download the current version of ccgbank-data.YYYY-MM-DD.tgz, and move it into the ccgbank directory, i.e. $OPENCCG_HOME/ccgbank/, with the undated name ccgbank-data.tgz. You'll also need to create a symbolic link to your original CCGbank directory from $OPENCCG_HOME/ccgbank/. (Alternatively, you can edit the original.ccgbank.dir property in the build.properties file in the ccgbank directory.) From this directory, you can unpack the data archive as shown below (where <dir> is the path to your original CCGbank directory):

$ mv ccgbank-data.YYYY-MM-DD.tgz $OPENCCG_HOME/ccgbank/ccgbank-data.tgz
$ cd $OPENCCG_HOME/ccgbank
$ ln -s <dir>/ccgbank1.1
$ ccg-build -f build-release.xml extract-data

The ccgbank-data tarball contains a patch file for converting the original CCGbank to the Propbank-enhanced version described in Boxwell and White (2008). The 'extract-data' target in build-release.xml does the patching after unpacking the archive and doing a space-to-newline conversion that enables the patch file to only contain the real differences between these CCGbank versions, given that diff works line-by-line and CCGbank derivations are given one per line. (Note that this conversion also ensures that the CCGbank cannot be recovered from the patch file, thereby avoiding a copyright violation for distributing the CCGbank.)

The ccgbank-data tarball also contains various auxiliary files that make it possible to use the BBN named entity annotations on the Penn Treebank as well as to insert the quotes that were unfortunately removed from the original CCGbank.
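The space-to-newline conversion mentioned above is what lets the line-oriented diff/patch machinery record only the tokens that actually differ between the two CCGbank versions. The sketch below illustrates the basic idea only; the actual scripts are bin/convert-spaces-to-newlines.py and bin/reverse-spaces-to-newlines.py, and the end-of-line marker used here is a made-up placeholder.

import java.io.*;
import java.nio.file.*;

// Illustrative sketch only: write one token per line so that diff/patch work
// at the token level; an end-of-line marker (the hypothetical token "<EOL>")
// records where the original one-derivation-per-line boundaries were, so the
// conversion can be reversed afterwards.
public class SpacesToNewlinesSketch {
    public static void main(String[] args) throws IOException {
        try (BufferedReader r = Files.newBufferedReader(Paths.get(args[0]));
             PrintWriter w = new PrintWriter(Files.newBufferedWriter(Paths.get(args[1])))) {
            String line;
            while ((line = r.readLine()) != null) {
                for (String tok : line.split(" ")) w.println(tok);
                w.println("<EOL>");
            }
        }
    }
}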
Once the Propbank-enhanced version of the CCGbank has been created and the aux files unpacked, the next step is to convert this version of the CCGbank to the one used by OpenCCG, which has a refined treatment of punctuation, refined categories for various function words, collapsed named entities and truecased text. The conversion is done by a series of XSLT transformations, which have the advantage of the declarative use of XPATH matching but unfortunately end up making the conversion quite slow. As such, the best way to do the conversion is to convert the sections in parallel. The bin/convert_all script converts all sections in parallel, as follows: $ cd $OPENCCG_HOME/ccgbank $ bin/convert_all As each section requires up to 1GB of memory to convert, it really only makes sense to convert all sections in parallel on a machine with at least 25GB of memory and multiple processors. The bin/convert_all script is very simple and can easily be edited to run fewer sections in parallel at a time. Running all sections in parallel should take less than an hour. Once the corpus conversion is complete, the next step is to extract grammars for the training, development and test sections of the CCGbank. (For testing, normally only the morph file is used from the dev and test sets, together with the training set grammar.) The grammar extraction process also creates testbed files for these sections, which contain logical forms derived by following the gold-standard derivations. Grammar extraction is done using the 'extract-various' target in the main build file (build.xml, the default): $ cd $OPENCCG_HOME/ccgbank $ ccg-build extract-various &> logs/log.extract.various & Extracting the grammars and creating the logical forms may take up to an hour and a half or so. Following corpus conversion and grammar extraction, the next step is to train the models. Most of the models can be trained using the 'all' target in build-models.xml: $ cd $OPENCCG_HOME/ccgbank $ ccg-build -f build-models.xml all &> logs/log.models.all & This target trains the supertagger and hypertagger as well as the generative parsing and realization models. As these models require several maxent training runs, this step will take a while, for example up to 24 hours depending on the speed of the machine. (In principle these steps could be partly parallelized, but doing so would be nontrivial given the existing dependencies between steps.) The final step is to train the realizer's averaged perceptron model. (It is also possible to train an averaged perceptron model for the parser, but it has not been found to yield significant gains over the generative model, most likely due to the size of the discrimination space.) Note that you should first install the very large language model as described in the section on using the pre-built models, if possible. Training the perceptron model requires generating training events for each training section, which is quite time consuming. Event generation is easily done in parallel, so the perceptron training sequence has been broken up to allow this step to be done separately: $ cd $OPENCCG_HOME/ccgbank $ ccg-build -f build-rz.xml event-gen-prep &> logs/log.rz.event.gen.prep & $ bin/gen_realizer_events_a & $ bin/gen_realizer_events_b & $ bin/gen_realizer_events_c & $ bin/gen_realizer_events_d & $ bin/gen_realizer_events_e & Preparing for event generation is fairly quick; once that's done, the bin/gen_realizer_events* scripts can all be run at the same time. 
These scripts are set up to run five sections at a time; they can be easily edited to run more or fewer in parallel. Event generation may take up to 12 hours, even with running 5 sections in parallel. Once event generation is complete, the actual perceptron training can be run: $ ccg-build -f build-rz.xml train-perceptron &> logs/log.rz.train.perceptron & Perceptron training is apt to take 8 hours. If your machine has 16g of memory available, training can be run in less than half the time by commenting in the "-in_mem" options in build-rz.xml, and editing bin/ccg-env to use a memory limit of 16g. With the models all built, the parser and realizer can be tested on the CCGbank development section: $ cd $OPENCCG_HOME/ccgbank $ ccg-build -f build-ps.xml test &> logs/log.ps.test & $ ccg-build -f build-rz.xml test-perceptron &> logs/log.rz.test.perceptron & If the models have been built correctly, the realization exact matches should be over 46% (using the very large language model), and the parsing unlabeled dependencies f-score should be about 0.89. (Note that with named entities collapsed and some function words not represented in the logical forms, these f-scores are not comparable to the dependency f-scores reported for other CCG parsers on the CCGbank.) Naturally, the models can also be run on novel text, as described in the section on using pre-built models. Viewing CCGbank derivations =========================== Derivations in the original or converted CCGbank can be viewed as trees using ccg-draw-tree, a front-end to the tree-drawing routine in NLTK's Tree class. This tool reads in .auto files, so to view converted CCGbank derivations, you must first export them to .auto format, as shown below: $ cd $OPENCCG_HOME/ccgbank $ ccg-build export-to-auto $ ccg-draw-tree convert/00/wsj_0001.auto wsj_0001.1 The export-to-auto target creates auto files for the current 'sect' and 'file' properties, which can be set in build.properties or provided on the command line (e.g. by -Dfile=*). This example assumes that the first file in Section 00 is included in the files to export in .auto format. Displaying the derivation for the first sentence in the converted CCGbank shows how balanced appositive commas are handled with "Pierre_Vinken , 61 years old ," (as well as a collapsed named entity), and also shows how "as a nonexecutive director" has been converted into an adjunct rather than an argument of "join". Installing the Stanford Core NLP tools ====================================== For novel text, it is useful to perform named entity (NE) recognition and labelling, as well as morphological processing (lemmatization). For this we use the Stanford Core NLP tools, available at: http://www-nlp.stanford.edu/software/corenlp.shtml To install them, simply download the archive from the above link, unpack it, and place the Core NLP JAR file in the 'ccgbank/stanford-nlp' directory, re-naming it 'stanford-core-nlp.jar'. If you wish to use another location or naming convention, you will need to update the properties file (ccgbank/build-ps.properties). 
Installing the Stanford Core NLP tools
======================================

For novel text, it is useful to perform named entity (NE) recognition and labelling, as well as morphological processing (lemmatization). For this we use the Stanford Core NLP tools, available at:

http://www-nlp.stanford.edu/software/corenlp.shtml

To install them, simply download the archive from the above link, unpack it, and place the Core NLP JAR file in the 'ccgbank/stanford-nlp' directory, re-naming it 'stanford-core-nlp.jar'. If you wish to use another location or naming convention, you will need to update the properties file (ccgbank/build-ps.properties).

If you're using a bash shell, you might do the following:

$ mkdir $OPENCCG_HOME/ccgbank/tmp
$ cd $OPENCCG_HOME/ccgbank/tmp
$ wget http://www-nlp.stanford.edu/software/stanford-corenlp-20xx-xx-xx.tgz
$ tar xvfz stanford-corenlp-20xx-xx-xx.tgz
$ cd stanford-corenlp-20xx-xx-xx
$ cp stanford-corenlp-20xx-xx-xx.jar $OPENCCG_HOME/ccgbank/stanford-nlp/stanford-core-nlp.jar

Note you will need to fill in the date, 20xx-xx-xx, with whatever the date of the most recent release is (see the particular file you get from the Stanford website).

To get the NE tagging models out of this download (the Stanford NE tagger combines predictions from multiple models), you will need to locate the 'stanford-corenlp-20xx-xx-xx-models.jar' file (in the same directory as the other JAR files) and un-jar it, like so [assuming you're still in the same directory as above]:

$ jar xf stanford-corenlp-20xx-xx-xx-models.jar
$ cp edu/stanford/nlp/models/ner/* $OPENCCG_HOME/ccgbank/stanford-nlp/classifiers/.
$ rm -rf edu

You should check that the filenames for the NE tagging models copied to $OPENCCG_HOME/ccgbank/stanford-nlp/classifiers match those listed in $OPENCCG_HOME/ccgbank/build-ps.properties as ner.model1, ner.model2 and ner.model3, updating this properties file if necessary. This will set up the only external dependency we have for parsing novel text using 'ccgbank/build-ps.xml'. If you wish to recompile (perhaps after modifying) the application that interfaces with the Stanford NE tagger's API, see the ant build file $OPENCCG_HOME/ccgbank/bin/ner/build-ner-api.xml and its corresponding properties file (in the same location).

Installing Zhang Le's maxent toolkit
====================================

To train the models, you'll need to have Zhang Le's maxent toolkit working with a small patch. Do the following to install the patched version of Zhang Le's toolkit in a directory of your choice:

$ cd
$ wget http://homepages.inf.ed.ac.uk/lzhang10/software/maxent/maxent-20061005.tar.bz2

Unpack the archive and patch the maxent.cpp file (the unpatched version doesn't cover the case where ':' can be part of the feature symbol itself, rather than just being a delimiter that separates string representations of features (contextual predicates, actually) from their real-valued activations):

$ bunzip2 maxent-20061005.tar.bz2
$ tar xf maxent-20061005.tar
$ cd maxent-20061005/src
$ patch maxent.cpp $OPENCCG_HOME/docs/maxent.cpp.patch

Now compile the maxent code:

$ cd
$ cd maxent-20061005
$ make clean all unittest

Test to make sure it (more or less) works (only 7 of the 8 tests seem to pass, but the training seems to work):

$ cd test
$ ./runall.py

Finally, add the 'maxent' binary (under 'maxent-20061005/src/opt') to your PATH environment variable.

References
==========

Michael White and Rajakrishnan Rajkumar. 2012. Minimal Dependency Length in Realization Ranking. In Proc. EMNLP-12.
http://aclweb.org/anthology-new/D/D12/D12-1023.bib

Rajakrishnan Rajkumar and Michael White. 2010. Designing Agreement Features for Realization Ranking. In Proc. of COLING-10.
http://aclweb.org/anthology-new/C/C10/C10-2119.bib

Michael White and Rajakrishnan Rajkumar. 2009. Perceptron Reranking for CCG Realization. In Proc. of the Conference on Empirical Methods in Natural Language Processing (EMNLP 2009).
http://aclweb.org/anthology-new/D/D09/D09-1043.bib

Rajakrishnan Rajkumar, Michael White and Dominic Espinosa. 2009. Exploiting Named Entity Classes in CCG Surface Realization. In Proc.
of Human Language Technologies: The 2009 Annual Conference of the North American Chapter of the Association for Computational Linguistics (NAACL HLT 2009). http://aclweb.org/anthology-new/N/N09/N09-2041.bib Michael White and Rajakrishnan Rajkumar. 2008. A More Precise Analysis of Punctuation for Broad-Coverage Surface Realization with CCG. In Proc. of the Workshop on Grammar Engineering Across Frameworks (GEAF08). http://aclweb.org/anthology-new/W/W08/W08-1704.bib Dominic Espinosa, Michael White and Dennis Mehay. 2008. Hypertagging: Supertagging for Surface Realization with CCG. In Proceedings of the 46th Annual Meeting of the Association for Computational Linguistics: Human Language Technologies (ACL-08: HLT). http://aclweb.org/anthology-new/P/P08/P08-1022.bib Stephen A. Boxwell and Michael White. 2008. Projecting Propbank Roles onto the CCGbank. In Proceedings of the Sixth International Conference on Language Resources and Evaluation (LREC-08). http://www.lrec-conf.org/proceedings/lrec2008/pdf/789_paper.pdf James R. Curran, Stephen Clark and David Vadas. 2006. Multi-Tagging for Lexicalized-Grammar Parsing. In Proc. ACL-06. http://aclweb.org/anthology-new/P/P06/P06-1088.bib Julia Hockenmaier and Mark Steedman. 2002. Generative Models for Statistical Parsing with Combinatory Categorial Grammar. In Proc. ACL-02. http://aclweb.org/anthology-new/P/P02/P02-1043.bib ================================================ FILE: docs/guide/build.xml ================================================ ================================================ FILE: docs/guide/cgloss4e.sty ================================================ % -*- LaTeX -*- % Following borrows from Covington's style files inspired by Midnight by M. % de Groot, adapted to be used with gb4e.sty: examples beginning with \ex can % contain glosses directly. Default is % Linguistic Inquiry style with all lines in \rm; to change a line (eg. to % \it for a particular journal, change the appropriate line: e.g., % \let\eachwordone=\rm in a copy of this file. Note that it will NOT work % to put \it before the line as the words are parsed separately. % Use \singlegloss to force single-spaced glosses even in double-space % environments. Works also in footnotes (^M as delimiter replaced by % \\)---hpk % %%% %%% Sentences with word-by-word glosses %%% % See covingtn.tex for full documentation. Some examples: % % Displayed sentence with gloss and translation: % % \gll Dit is een Nederlands voorbeeld.\\ % This is a Dutch example.\\ % \glt `This is an example in Dutch.' % % Same, using bracketing where words do not correspond one-to-one: % % \gll Dit is een voorbeeldje in het Nederlands.\\ % This is a {little example} in {} Dutch.\\ % \glt `This is a little example in Dutch.' % % If you want to align 3 lines rather than two, use \glll instead of \gll. % % Layout is critical between \gll (or \glll) and \glt (or \gln). % % Thanks to Marcel R. van der Goot for permission to reproduce code. \let\@gsingle=1 \def\singlegloss{\let\@gsingle=1} \def\nosinglegloss{\let\@gsingle=0} \@ifundefined{new@fontshape}% {\def\@selfnt{\ifx\@currsize\normalsize\@normalsize\else\@currsize\fi}} {\def\@selfnt{\selectfont}} \def\gll% % Introduces 2-line text-and-gloss. {\begin{flushleft} \ifx\@gsingle1% conditionally force single spacing (hpk/MC) \vskip\baselineskip\def\baselinestretch{1}% \@selfnt\vskip-\baselineskip\fi% \bgroup \twosent } \def\glll% % Introduces 3-line text-and-gloss. 
{\begin{flushleft} \ifx\@gsingle1% conditionally force single spacing (hpk/MC) \vskip\baselineskip\def\baselinestretch{1}% \@selfnt\vskip-\baselineskip\fi% \bgroup \threesent } \def\glt{\vskip.17\baselineskip} % Introduces a translation \let\trans\glt \def\glend{} % obsolete % Ends the gloss environment. % The following TeX code is adapted, with permission, from: % gloss.tex: Macros for vertically aligning words in consecutive sentences. % Version: 1.0 release: 26 November 1990 % Copyright (c) 1991 Marcel R. van der Goot (marcel@cs.caltech.edu). % Original Midnight/gloss.tex and Midnight/gloss.doc are available from % csvax.cs.caltech.edu [131.215.131.131] in pub/tex % and many other anonymous ftp archives. \newbox\lineone% boxes with words from first line \newbox\linetwo% \newbox\linethree% \newbox\wordone% a word from the first line (hbox) \newbox\wordtwo% \newbox\wordthree% \newbox\gline% the constructed double line (hbox) \newskip\glossglue% extra glue between glossed pairs or triples \glossglue = 0pt plus 2pt minus 1pt % allow stretch/shrink between words %\glossglue = 5pt plus 2pt minus 1pt % allow stretch/shrink between words \newif\ifnotdone \@ifundefined{eachwordone}{\let\eachwordone=\rm}{\relax} \@ifundefined{eachwordtwo}{\let\eachwordtwo=\rm}{\relax} \@ifundefined{eachwordthree}{\let\eachwordthree=\rm}{\relax} \def\lastword#1#2#3% #1 = \each, #2 = line box, #3 = word box {\setbox#2=\vbox{\unvbox#2% \global\setbox#3=\lastbox% }% \ifvoid#3\global\setbox#3=\hbox{#1\strut{} }\fi % extra space following \strut in case #1 needs a space } \def\testdone {\ifdim\ht\lineone=0pt \ifdim\ht\linetwo=0pt \notdonefalse % tricky space after pt \else\notdonetrue \fi \else\notdonetrue \fi } \gdef\getwords(#1,#2)#3 #4\\% #1=linebox, #2=\each, #3=1st word, #4=remainder {\setbox#1=\vbox{\hbox{#2\strut#3 }% adds space \unvbox#1% }% \def\more{#4}% \ifx\more\empty\let\more=\donewords \else\let\more=\getwords \fi \more(#1,#2)#4\\% } \gdef\donewords(#1,#2)\\{}% \gdef\twosent#1\\ #2\\{% #1 = first line, #2 = second line \getwords(\lineone,\eachwordone)#1 \\% \getwords(\linetwo,\eachwordtwo)#2 \\% \loop\lastword{\eachwordone}{\lineone}{\wordone}% \lastword{\eachwordtwo}{\linetwo}{\wordtwo}% \global\setbox\gline=\hbox{\unhbox\gline \hskip\glossglue \vtop{\box\wordone % vtop was vbox \nointerlineskip \box\wordtwo }% }% \testdone \ifnotdone \repeat \egroup % matches \bgroup in \gloss \gl@stop} \gdef\threesent#1\\ #2\\ #3\\{% #1 = first line, #2 = second line, #3 = third \getwords(\lineone,\eachwordone)#1 \\% \getwords(\linetwo,\eachwordtwo)#2 \\% \getwords(\linethree,\eachwordthree)#3 \\% \loop\lastword{\eachwordone}{\lineone}{\wordone}% \lastword{\eachwordtwo}{\linetwo}{\wordtwo}% \lastword{\eachwordthree}{\linethree}{\wordthree}% \global\setbox\gline=\hbox{\unhbox\gline \hskip\glossglue \vtop{\box\wordone % vtop was vbox \nointerlineskip \box\wordtwo \nointerlineskip \box\wordthree }% }% \testdone \ifnotdone \repeat \egroup % matches \bgroup in \gloss \gl@stop} \def\gl@stop{{\hskip -\glossglue}\unhbox\gline\end{flushleft}} \endinput ================================================ FILE: docs/guide/gb4e.sty ================================================ % -*- LaTeX -*- \def\gbVersion{4e} %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% % Version 4export (= v. 4 minus the compatibility code) % Based on hpk's gb.sty, revised for GM syllabus by ct, % and incorporating macros adapted from J.Frampton, M. de Groot en M. % Covington. Full documentation soon to come in gb4doc.tex. 
Bug-reports % and suggestions for improvements, other used features, please! % % Notes: % % Various styles for X-bar levels; can be changed, but note that {picture} % environements (e.g. trees) will then come out wrong and have to be % fixed % % This file allows _ and ^ to be used in ordinary text, hence must be % loaded AFTER any file that uses them in their TeX meaning. Hence % cgloss(n).sty is loaded early in this file. %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% %%%%%%%%%%%%%%%%%%%%%%%% % Format of examples: % %%%%%%%%%%%%%%%%%%%%%%%% % \begin{exe} or \exbegin % (arab.) % \begin{xlist} or \xlist % (1st embedding, alph.) % \begin{xlisti} or \xlisti % (2st embedding, rom.) % \end{xlisti} or \endxlisti % % \end{xlist} or \endxlist % % \end{exe} or \exend % % Other sublist-styles: xlistA (Alph.), xlistI (Rom.), xlistn (arab) % % \ex (produces Number) % \ex (numbered example) % \ex[jdgmt]{sentence} (numbered example with judgement) % % \exi{ident} (produces identifier) % \exi{ident} (example numbered with identifier) % \exi{ident}[jdgmt]{sentence} (dito with judgement) % (\exr, \exp and \sn are defined in terms of \exi) % % \exr{label} (produces cross-referenced Num.) % \exr{label} (cross-referenced example) % \exr{label}[jdgmt]{sentence} (cross-referenced example with judgement) % % \exp{label} (same as % \exp{label} \exr but % \exp{label}[jdgmt]{sentence} with prime) % % \sn (unnumbered example) % \sn[jdgmt]{sentence} (unnumbered example with judgement) % %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% \@ifundefined{new@fontshape}{\def\reset@font{}\let\mathrm\rm}{} \let\prmbrs=0 \def\primebars{\let\prmbrs=1} \def\obar#1{\ifmmode#1^{0}\else#1$^{0}$\fi} %% FIX \def\mbar#1{\ifmmode#1^{\mathrm{max}}\else#1$^{\mathrm{max}}$\fi} \def\ibar#1{\ifx\prmbrs0% \ifmmode\overline{\mathrm{#1}}\else$\overline{\mbox{#1}}$\fi% \else\ifmmode#1^{'}\else#1$^{'}$\fi\fi} \def\iibar#1{\ifx\prmbrs0% \ifmmode\overline{\overline{\mathrm{#1}}}% \else$\overline{\overline{\mbox{#1}}}$\fi% \else #1P\fi} \def\th{\ifmmode\theta\else$\theta$\fi} \def\al{\ifmmode\alpha\else$\alpha$\fi} \def\be{\ifmmode\beta\else$\beta$\fi} \def\ga{\ifmmode\gamma\else$\gamma$\fi} \def\de{\ifmmode\delta\else$\delta$\fi} \def\spec#1{[Spec,#1]} %Def. of "Specifier of #1" \def\ct#1{{\em #1\/}} %Citation of linguistic material with alternative style: %\def\ct#1{`#1'} \def\tx{\bf} %Introduction of technical terms with alternative style: %\def\tx{\em} \input{cgloss\gbVersion.sty} %%% NEWSTUFF: %\newcommand{\indexgroupmark}[1]{\item{\bf #1}} % ?? -CT % this allows _ to be used in horizontal mode (from J.Frampton): % \catcode`_=\active % \def_#1{\ifmmode\mit{\sb{#1}}\else${}\sb{#1}$\fi} % \catcode`^=\active % \def^#1{\ifmmode\mit{\sp{#1}}\else${}\sp{#1}$\fi} % \def\lb#1{\@ifnextchar [{\@glarph{#1}}{\@bl{#1}}} %\def\@glarph#1[#2]{\ifmmode{[}\sb{{\mathrm{#1}}\sb{#2}}\else% % ${[}\sb{{\mathrm{#1}}\sb{#2}}$\fi} % \def\@bl#1{\ifmmode{[}\sb{\mathrm{#1}}\;\else${[}\sb{\mathrm{#1}}\;$\fi} % \def\rb#1{\@ifnextchar [{\@grarph{#1}}{\@br{#1}}} %\def\@grarph#1[#2]{\ifmmode{]}\sb{{\mathrm{#1}}\sb{#2}}\else% % ${]}\sb{{\mathrm{#1}}\sb{#2}}$\fi} % \def\@br#1{\ifmmode{]}\sb{\mathrm{#1}}\;\else${]}\sb{\mathrm{#1}}\;$\fi} %%% END_NEWSTUFF. %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% % Macros for examples, roughly following Linguistic Inquiry style. % % From here on best not to tamper, else all the examples and cross- % % references will come out scrambled! 
(see also note below) - CT % % Completely rewritten for more robustness and flexibility. (hpk) % %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% \def\qlist{\begin{list}{\Alph{xnum}.}{\usecounter{xnum}% \setlength{\rightmargin}{\leftmargin}}} \def\endqlist{\end{list}} \newif\if@noftnote\@noftnotetrue \newif\if@xrec\@xrecfalse \@definecounter{fnx} %%%% adapted from latex.tex to get examples in footnotes right \long\def\@footnotetext#1{% \@noftnotefalse\setcounter{fnx}{0}% \insert\footins{\reset@font\footnotesize \interlinepenalty\interfootnotelinepenalty \splittopskip\footnotesep \splitmaxdepth \dp\strutbox \floatingpenalty \@MM \hsize\columnwidth \@parboxrestore \edef\@currentlabel{\csname p@footnote\endcsname\@thefnmark}\@makefntext {\rule{\z@}{\footnotesep}\ignorespaces #1\strut}}\@noftnotetrue} \newcount\@xnumdepth \@xnumdepth = 0 \@definecounter{xnumi} \@definecounter{xnumii} \@definecounter{xnumiii} \@definecounter{xnumiv} \@definecounter{exx} \setcounter{exx}{0} \def\thexnumi{\@xsi{xnumi}} \def\thexnumii{\@xsii{xnumii}} \def\thexnumiii{\@xsiii{xnumiii}} \def\thexnumiv{\@xsiv{xnumiv}} \def\p@xnumii{\thexnumi} \def\p@xnumiii{\thexnumi\thexnumii-} \def\p@xnumiv{\thexnumi\thexnumii-\thexnumiii-} \def\xs@default#1{\csname @@xs#1\endcsname} \def\@@xsi{\let\@xsi\arabic} \def\@@xsii{\let\@xsii\alph} \def\@@xsiii{\let\@xsiii\roman} \def\@@xsiv{\let\@xsi\arabic} \@definecounter{rxnumi} \@definecounter{rxnumii} \@definecounter{rxnumiii} \@definecounter{rxnumiv} \def\save@counters{% \setcounter{rxnumi}{\value{xnumi}}% \setcounter{rxnumii}{\value{xnumii}}% \setcounter{rxnumiii}{\value{xnumiii}}% \setcounter{rxnumiv}{\value{xnumiv}}}% \def\reset@counters{% \setcounter{xnumi}{\value{rxnumi}}% \setcounter{xnumii}{\value{rxnumii}}% \setcounter{xnumiii}{\value{rxnumiii}}% \setcounter{xnumiv}{\value{rxnumiv}}}% \def\exewidth#1{\def\@exwidth{#1}} \exewidth{(234)} \def\exe{\@ifnextchar [{\@exe}{\@exe[\@exwidth]}} \def\@exe[#1]{\ifnum \@xnumdepth >0% \if@xrec\@exrecwarn\fi% \if@noftnote\@exrecwarn\fi% \@xnumdepth0\@listdepth0\@xrectrue% \save@counters% \fi% \advance\@xnumdepth \@ne \@@xsi% \begin{list}{(\thexnumi)}% {\usecounter{xnumi}\@subex{#1}{1em}% \if@noftnote% \setcounter{xnumi}{\value{exx}}% \else% \setcounter{xnumi}{\value{fnx}}% \fi}} \def\endexe{\if@noftnote\setcounter{exx}{\value{xnumi}}% \else\setcounter{fnx}{\value{xnumi}}% \reset@counters\@xrecfalse\fi\end{list}} \def\@exrecwarn{\typeout{*** Recursion on "exe"---your example numbering will probably be screwed up!}} \def\xlist{\@ifnextchar [{\@xlist{}}{\@xlist{}[iv.]}} \def\xlista{\@ifnextchar [{\@xlist{\alph}}{\@xlist{\alph}[m.]}} \def\xlisti{\@ifnextchar [{\@xlist{\roman}}{\@xlist{\roman}[iv.]}} \def\xlistn{\@ifnextchar [{\@xlist{\arabic}}{\@xlist{\arabic}[9.]}} \def\xlistA{\@ifnextchar [{\@xlist{\Alph}}{\@xlist{\Alph}[M.]}} \def\xlistI{\@ifnextchar [{\@xlist{\Roman}}{\@xlist{\Roman}[IV.]}} \def\endxlist{\end{list}} \def\endxlista{\end{list}} \def\endxlistn{\end{list}} \def\endxlistA{\end{list}} \def\endxlistI{\end{list}} \def\endxlisti{\end{list}} %%% a generic sublist-styler \def\@xlist#1[#2]{\ifnum \@xnumdepth >3 \@toodeep\else% \advance\@xnumdepth \@ne% \edef\@xnumctr{xnum\romannumeral\the\@xnumdepth}% \def\@bla{#1} \ifx\@bla\empty\xs@default{\romannumeral\the\@xnumdepth}\else% \expandafter\let\csname @xs\romannumeral\the\@xnumdepth\endcsname#1\fi \begin{list}{\csname the\@xnumctr\endcsname.}% {\usecounter{\@xnumctr}\@subex{#2}{1.5ex}}\fi} \def\@subex#1#2{\settowidth{\labelwidth}{#1}\itemindent\z@\labelsep#2% 
\ifnum\the\@xnumdepth=1\topsep 7\p@ plus2\p@ minus3\p@\else% \topsep 2\p@ plus2\p@\fi\parsep 2\p@ plus\p@ minus\p@% \itemsep \parsep\leftmargin\labelwidth\advance\leftmargin#2\relax} %%% the example-items \def\ex{\@ifnextchar [{\@ex}{\item}} \def\@ex[#1]#2{\item\@exj[#1]{#2}} \def\@exj[#1]#2{\@exjbg{#1} #2 \end{list}} \def\exi#1{\item[#1]\@ifnextchar [{\@exj}{}} \def\judgewidth#1{\def\@jwidth{#1}} \judgewidth{??} \def\@exjbg#1{\begin{list}{#1}{\@subex{\@jwidth}{.5ex}}\item} \def\exr#1{\exi{{(\ref{#1})}}} \def\exp#1{\exi{{(\ref{#1}$'$)}}} \def\sn{\exi{}} \def\bu{\item[$\bullet$]} %%%%%%% \lcomment for breaks in (example-)lists (leaves all counters %%%%%%% as they are) (hpk) \newlength{\lcommentsep} \lcommentsep = 1ex \long\def\lcomment#1% {\vspace{\lcommentsep} \item[]\hspace*{-\leftmargin}% \@tempskipa=\linewidth% \addtolength{\@tempskipa}{\rightmargin}% \addtolength{\@tempskipa}{\leftmargin}% \parbox{\@tempskipa}{#1}% \vspace{\lcommentsep}% } %%%%%% control the alignment of exampleno. and (picture-)example %%%%%% (by Lex Holt ). \def\attop#1{\leavevmode\vtop{\strut\vskip-\baselineskip\vbox{#1}}} \def\atcenter#1{$\vcenter{#1}$} %%%%%% %-------------------Move Arrows (from J.Frampton): \def\leaderfill{\leaders\hrule\hfil} \def\pointerup{\hbox to 0pt{\hss \vbox{\offinterlineskip\vskip-1pt\hbox{\elevenex\char'170}\null}\hss}} \def\pointerdown{\hbox to 0pt{\hss \vtop{\offinterlineskip\null\hbox{\elevenex\char'171}\vskip-1pt}\hss}} \let\pu=\pointerup \let\pd=\pointerdown \let\lf=\leaderfill \def\spacer{\hskip4.5pt} \def\fillright#1{\hfil#1\leaderfill} \def\fillleft#1{\leaderfill#1\hfil} % Changed spelling to \centr, else conflicts with LaTeX \center{} -CT \def\centr#1{\leaderfill#1\leaderfill} \def\link#1{\multispan#1\leaderfill} \def\arrowalign#1{\vtop{\baselineskip=0pt \lineskiplimit=0pt \lineskip=2pt \halign{&##\cr#1}}} %\font\elevenex=cmex10 scaled\magstephalf % just for the arrow! %PS: this may not work on some installations, not sure why. CT %%PPS: (e.g., PCTeX, but it works find works fine with EmTeX) %----------------END Move Arrows \def\pijl{$\rightarrow$\ } % Special accents for Vata & Gbadi; Navajo coming soon, I hope...: %\def\bb#1{$\mathrm{\overline{#1}}$} Following looks better: \def\bb#1{\ifmmode\overline{\mathrm{#1}}\else$\bar{\mathrm{#1}}$\fi} \def\boven#1#2{\raisebox{-0.2pt}{$\stackrel{#1}{\mathrm{#2}}$}} \def\bovenop#1#2{\raisebox{-0.06ex}[0ex][0ex]{$\stackrel{#1}{\mathrm{#2}}$}} \def\vl{\rule{0.05em}{0.30em}} \def\|#1{\ifmmode\vert#1\else\bovenop{\vl}{#1}\fi} ================================================ FILE: docs/guide/guide.tex ================================================ %% %% nb: use pdflatex to create pdf file with hyperlinks %% %% ===================================================================== %% DOCUMENT DATA %% ===================================================================== \documentclass[11pt]{article} \title{Specifying Grammars for OpenCCG: \\ A Rough Guide} \author{Cem Boz\c{s}ahin \and Geert-Jan M. Kruijff \and Michael White} %% ===================================================================== %% PACKAGES %% ===================================================================== \usepackage{openccg} % for hlds/ccg \usepackage{graphicx} % for figs \usepackage{gb4e} % for examples \usepackage[ colorlinks=true, linkcolor=blue, citecolor=blue, urlcolor=blue, pdfstartview=FitH, pdftitle={Specifying Grammars for OpenCCG: A Rough Guide}, pdfauthor={Cem Bozsahin, Geert-Jan M. 
Kruijff and Michael White} ]{hyperref} %% ===================================================================== %% NEW COMMANDS %% ===================================================================== %\newcommand{\occg}{\textsf{OpenCCG}} \newcommand{\occg}{OpenCCG} \newcommand{\tccg}{\textsf{tccg}} %% ===================================================================== %% DOCUMENT BODY %% ===================================================================== \begin{document} \thispagestyle{empty} \maketitle \tableofcontents \listoftables \listoffigures \newpage \section{OpenCCG} \occg\ is an open source natural language processing library written in Java, which provides parsing and realization services based on Mark Steedman's Combinatory Categorial Grammar (CCG) formalism \cite{Steedman:SynProc}. The library makes use of the multi-modal extensions to CCG devised by Jason Baldridge in his dissertation \cite{Baldridge:2002} and in a joint EACL-03 paper with Geert-Jan Kruijff \cite{Baldridge/Kruijff:2003}. For a concise introduction to CCG with these extensions, see \cite{Steedman/Baldridge:2003}. \occg\ grew out of the Grok system developed by Gann Bierner and Jason Baldridge, and has been refined and extended by Michael White, with further contributions from Cem Boz\c{s}ahin, G\"une\c{s} Erkan, Geert-Jan Kruijff, David Reitter and Alexandros Triantafyllidis. Recent development efforts, managed by Michael White, have focused on making the realizer \cite{White/Baldridge:2003,White-RLAC:2004,White-INLG:2004,White-ACLSoft:2005} practical to use in dialogue systems, and improving (somewhat) the grammar development process. You can download and install \occg\ from its website, located at \url{http://openccg.sourceforge.net}. Once you've unpacked the archive, have a look at the \texttt{README} file for installation instructions. \section{About this (rough) guide} This guide is intended to provide a brief introduction to writing grammars for \occg. The system is implemented in Java, but you do not need to know Java. \occg\ provides its own formats for describing grammars, including the combinatory rules, the lexicon (i.e.\ the lexicalized grammar), feature structures, LF, morphology etc. Two formats are available; one is based on XML and one is a higher-level format that looks similar to C or Java. The syntax of the XML-based format is very simple, but at the same time it can be verbose and hard-to-read. The other format, the so-called ``CCG format'' (\texttt{.ccg}), was specifically designed to be written by hand, and has a richer and more concise syntax. It is a ``front-end'' format in that it is converted internally to XML before it is actually used by \occg, using the \texttt{ccg2xml} tool. As a result, the two formats share many conceptual similarities. \textbf{NB:} Note that the XML format is more stable than the \texttt{.ccg} format, and in particular, the way in which unification constraints are specified in the \texttt{.ccg} format is apt to change. This manual was originally created before the CCG format existed. As a result, it is primarily geared towards writing grammars directly in XML. Over time, however, it will be updated to cover the use of the CCG format as well. For the time being, see \texttt{src/ccg2xml/README} for documentation of the \texttt{.ccg} format. \section{Using the XML-based format} In order to write \occg grammars directly in the XML-based format, you should be familiar with XML. 
Actually, all you need to know is that tags can be hierarchically and linearly organized, and that they must be ``closed'' (by \texttt{} or \texttt{/>}) with proper nesting, e.g. \begin{verbatim} Bond James Jimbo Double-Oh (Seven) \end{verbatim} \begin{verbatim} \end{verbatim} All the \occg-defined elements and attributes are listed in the XML schema validation files. For reference documentation, you can have a look at these files, which are located in the \texttt{\$OPENCCG\_HOME/grammars/} directory of your installation. For example, \texttt{categories.xsd} describes the tags that go into \occg\ categories. For more advanced use of \occg, it helps to know \href{http://www.w3.org/Style/XSL/}{XSLT}. \subsection{XML-based grammar architecture in \occg} A run-time grammar for \occg\ typically consists of five primary files, with the following canonical names: \begin{description} \item[\texttt{grammar.xml}] Specifies the name of the grammar, and lists the names of the other files. This file may also specify XSLT transformations to use in converting LFs to/from XML, and/or properties of a custom tokenizer (see \texttt{grammar.xsd} for details). \item[\texttt{lexicon.xml}] Specifies \emph{lexical families}. A lexical family specifies one or more related categories, with their associated feature structures and logical forms. Lexical families are loosely based on the notion of \emph{tree families} in \href{http://www.cis.upenn.edu/~xtag/}{XTAG}. \item[\texttt{morph.xml}] Specifies the \emph{words} of the grammar. Each word is related to a lexical family through the part-of-speech tag of the word. If a family is a closed class, we specify explicitly with a family what words are its members. \item[\texttt{rules.xml}] Specifies which combinatory rules are available to the grammar. For the purpose of this document, we assume that application, type-raising, and composition (harmonic as well as crossed) are available. Unary type changing rules are also placed into \texttt{rules.xml}. \item[\texttt{types.xml} (optional)] Specifies the syntactic and semantic type/sort hierarchies. Unlike HPSG, only atomic types are supported in \occg. Multiple-inheritance is allowed \cite{erkanms03}. \end{description} Standard practice is to store these files in a directory under the \texttt{grammars} directory of the \occg\ distribution. Besides the above files, it is also a good idea to have a \texttt{testbed.xml} file. A testbed is a list of test expressions, where we specify for each expression the number of parses ($\geq 0$) the grammar should yield, and optionally the intended LF. \section{Words and categories} \label{sec:cats} \subsection{Lexical families} Traditionally, the lexicon for a categorial grammar specifies for each word its own category. In \occg, categories are instead organized into lexical \textsl{families}, which are related to whole sets of words. (As mentioned earlier, the idea of families we employ here is loosely based on the notion of \emph{tree families} in XTAG.) This makes it possible to avoid giving the same specification over and over again in a lexicon. The simplest way in which words can be related to families is through their parts of speech: for a word we have to specify its part of speech, and for a family we have to specify the part of speech a word has to have for the family to be applicable. To control the applicability of a family, we can also declare it to be \textsl{closed}. 
A closed family is not applicable to \emph{every} word that has the appropriate part of speech, but only to those words (stems) that are listed with the family as its members. Note that a closed family does not exactly correspond to the notion of a closed class word, as open class words (especially verbs) are often listed as members of closed families, in order to assign them appropriate subcategorization frames. To illustrate, let's look at some examples from the \texttt{tiny} sample grammar. A family is defined within the following element: \begin{verbatim} : : \end{verbatim} \noindent These two families are for nouns and pronominal NPs, as their \textsl{name} attributes indicate; they have parts of speech \texttt{N} and \texttt{Pro}, respectively, given by the \textsl{pos} attribute. The pronominal NP family has \texttt{closed="true"}, indicating that it's a closed family. The members are \texttt{pro1} \ldots \texttt{pro3n}, where \texttt{pro1} is an abstract stem for the first person pronouns \gf{I, we, me, us}, and so on. In each family, we define one or more entries, using an \textsl{entry} element. Each entry defines a category with accompanying feature structure and logical form. Each entry is given a name; we usually give the main entry \texttt{name="Primary"}. An example of a family with multiple (ok, two) entries appears below. The first entry is named \texttt{DTV}, for ditransitive verb, as it specifies a category with two NP complements; the second entry is named \texttt{NP-PPfor}, as it specifies a category with an NP complement followed by a PP complement headed by \gf{for}. In both cases, the extra complement plays the role of Beneficiary in the semantics, motivating the grouping of these two entries into a single family. \begin{small} \begin{verbatim} : : \end{verbatim} \end{small} \subsection{Categories} Within an entry we define a category. A category can either be atomic or complex (i.e.\ a function). The example below illustrates how we specify an atomic category using the \textsl{atomcat} element, giving its label as a value of the attribute \textsl{type}. \begin{verbatim} : \end{verbatim} We can assign a feature structure to an atomic category using the \textsl{fs} element. The \textsl{fs} element has an \textsl{id} attribute so that we can explicitly reference the feature structure, when needed. \begin{verbatim} .. : \end{verbatim} We can add individual features using \textsl{feat} elements. In their simplest form, a feature has an \textsl{attr} specifying the attribute and a \textsl{val} giving the value of the attribute. \begin{verbatim} \end{verbatim} Now, since we don't want all nouns to be singular, we can instead declare the value of the \texttt{num} feature to be a variable, as follows: \begin{verbatim} : : \end{verbatim} \noindent Here the \textsl{featvar} element introduces a variable with \texttt{name="NUM"} as the value of the feature. Note that this feature specification serves as an implicit declaration that nouns have a \texttt{num} feature. As such, it interacts with the \textsl{inheritsFrom} mechanism for default unification, as will be explained below. With basic categories such as this one, it is a good idea to specify all relevant features. An entry can also specify a \emph{complex} category, i.e.\ a function. For that, we use the \textsl{complexcat} element. This element is essentially a list, enumerating the result category and its arguments in the order as given by a Steedman-style category. 
Argument categories may be atomic or complex (i.e., creating a higher-order function); the result category must be atomic (see \cite{Baldridge:2002} for discussion). \begin{table} \begin{center} \begin{tabular}{rcc} Rules & \occg & MMCCG \\ \hline application only & \texttt{*} & $\star$ \\ associative & \verb+^+ & $\diamond$ \\ permutative & \texttt{x} & $\times$ \\ permutative right & \texttt{x>} & $\times\triangleright$\\ permutative left & \texttt{} & $\triangleright$\\ associative permutative left & \texttt{<} & $\triangleleft$\\ all rules & \texttt{.} & $\bullet$ \\ \hline %[.2em] \end{tabular} \end{center} \caption{Slash modes} \label{slash-modes} \end{table} For each argument we give the slash using a \textsl{slash} element that has attributes \textsl{mode} and \textsl{dir} to specify what kind of slash we are dealing with. The available slash modes are given in Table~\ref{slash-modes}. (Note that in XML, the angle brackets \texttt{<} and \texttt{>} must be escaped as \texttt{\&lt;} and \texttt{\&gt;}, respectively.) See \cite{Baldridge:2002}[p.\ 100] and \cite{Baldridge/Kruijff:2003} for discussion of the slash modes in multimodal CCG. Slashes may also have variables over modes, and may be inert, as discussed in \cite{Baldridge:2002}[Ch.\ 8]. \begin{figure} \begin{quote} \begin{verbatim} .. .. .. : \end{verbatim} \end{quote} \[ \cf{s\fsb{1}{}} \bs \cf{np\fsb{2}{nom}} / \cf{np\fsb{3}{acc}} \] \caption{Transitive verb category} \label{tv-cat} \end{figure} Figure~\ref{tv-cat} shows how the category for a transitive verb can be defined; at the bottom of the figure is a more human-friendly notation for the category. The result category is \cf{s}. There are two argument categories, an \cf{np} with accusative case to the right, and an \cf{np} with nominative case to the left. In the human notation, the feature structure id's are shown subscripted in angle brackets, followed by the features themselves. Note that when the intended feature is evident from the feature value, the feature name is left off; also, when the slash mode is consistent with the slash direction (e.g.\ $\triangleright$ and /), the mode is not shown, as in \cite{Baldridge:2002}. \subsection{Words} \label{words} Since pronouns retain case marking in English, the case requirements on the arguments of a transitive verb have the effect of determining which pronouns can appear in which positions. For example, the first person pronoun \gf{I} is allowed in subject position, while \gf{me} is allowed in object position, but not vice-versa. This naturally leads us to how we specify properties of words in the \texttt{morph.xml} file. For each word, we have to give its wordform and part of speech, as follows: \begin{verbatim} \end{verbatim} \noindent If the word's stem differs from its form, the stem must be listed too: \begin{verbatim} \end{verbatim} \begin{figure} %\begin{quote} \begin{small} \begin{verbatim} : \end{verbatim} \end{small} %\end{quote} \[ \begin{array}{rcl} \gf{I} & \vdash & \cf{np\fsb{2}{1st,sg,nom}} \\ \gf{me} & \vdash & \cf{np\fsb{2}{1st,sg,acc}} \\ \gf{we} & \vdash & \cf{np\fsb{2}{1st,pl,nom}} \\ \gf{us} & \vdash & \cf{np\fsb{2}{1st,pl,acc}} \\ \end{array} \] \caption{Case macros} \label{case-macros} \end{figure} To add further information, such as case, we use \textsl{macros}, as illustrated in Figure~\ref{case-macros}. In the figure, the entries for the first person pronouns are given, along with their syntactic macros, specified by the \textsl{macros} attribute.
The case macros, named \texttt{@nom} and \texttt{@acc}, appear next in the figure, defined by the \textsl{macro} elements. These macros set the case feature on the category associated with the word (via its part of speech), by accessing the feature structure with id 2 and setting the value of the \texttt{case} feature to \texttt{nom} and \texttt{acc}, respectively. (The number macros \texttt{@sg} and \texttt{@pl} are analogous.) The effects of the macros are shown at the bottom of the figure, where the word forms for the first person pronouns are paired with their associated categories, which differ in their number and case values. \begin{figure} %\begin{quote} \begin{small} \begin{verbatim} : \end{verbatim} \end{small} %\end{quote} \[ \begin{array}{rcl} \gf{buy} & \vdash & \cf{s\fsb{1}{}} \bs \cf{np\fsb{2}{non\mbox{-}3rd,sg,nom}} / \cf{np\fsb{3}{acc}} \\ \gf{buys} & \vdash & \cf{s\fsb{1}{}} \bs \cf{np\fsb{2}{3rd,sg,nom}} / \cf{np\fsb{3}{acc}} \\ \gf{buy} & \vdash & \cf{s\fsb{1}{}} \bs \cf{np\fsb{2}{pl,nom}} / \cf{np\fsb{3}{acc}} \\ \gf{bought} & \vdash & \cf{s\fsb{1}{}} \bs \cf{np\fsb{2}{nom}} / \cf{np\fsb{3}{acc}} \\ \end{array} \] \caption{Person macros} \label{pers-macros} \end{figure} As another example, Figure~\ref{pers-macros} shows how the person macros are used (together with the number macros) in setting up person and number agreement constraints with various forms of the verb \gf{buy}. Note that the tense macros \texttt{@pres} and \texttt{@past} do not contribute syntactic features; instead they contribute semantic features to the logical form (cf.\ Section~\ref{lfs}). Additionally, note that the macro \texttt{@non-3rd} supplies a syntactic person value that is compatible with both \texttt{1st} and \texttt{2nd}, as specified in \texttt{types.xml} (cf.\ Section~\ref{types}). It is important to note that macro instantiation does not involve unification: macros set feature values regardless of any value that might already be present for the feature in the feature structure. Conceivably, it would be convenient on occasion (though computationally more expensive) to use unification, rather than overwriting, during macro instantiation, but there is no support for doing so at present. \subsection{Unification} \begin{figure} \begin{quote} %\begin{small} \begin{verbatim} .. .. \end{verbatim} %\end{small} \end{quote} \[ \gf{the} ~ \vdash ~ \cf{np\fsb{2}{3rd}}/_{\!\!\diamond}\cf{n\fsb{2}{}} \] \caption{The definite article} \label{def-art} \end{figure} \begin{figure} \begin{center} \deriv{3}{ \gf{the} & \gf{teacher} & \gf{buys} \\ \uline{1} & \uline{1} & \uline{1} \\ \cf{np\fsb{2}{3rd}}/_{\!\!\diamond}\cf{n\fsb{2}{}} & \cf{n\fb{sg}} & \cf{s} \bs \cf{np\fb{3rd,sg,nom}} / \cf{np\fb{acc}} \\ \fapply{2} \\ \cmc{2}{\cf{np\fsb{2}{3rd,sg}}} \\ \ftype{2} \\ \cmc{2}{\cf{s\fsb{1}{}} / \cf{s\fsb{1}{}} \bs \cf{np\fsb{2}{3rd,sg}}} \\ \fcomp{3} \\ \cmc{3}{\cf{s\fsb{1}{}} / \cf{np\fb{acc}}} } \vspace{1cm} \deriv{3}{ \gf{the} & \gf{teachers} & \gf{*buys} \\ \uline{1} & \uline{1} & \uline{1} \\ \cf{np\fsb{2}{3rd}}/_{\!\!\diamond}\cf{n\fsb{2}{}} & \cf{n\fb{pl}} & \cf{s} \bs \cf{np\fb{3rd,sg,nom}} / \cf{np\fb{acc}} \\ \fapply{2} \\ \cmc{2}{\cf{np\fsb{2}{3rd,pl}}} \\ \ftype{2} \\ \cmc{2}{\cf{s\fsb{1}{}} / \cf{s\fsb{1}{}} \bs \cf{np\fsb{2}{3rd,pl}}} \\ \badcomb{3}{{>}\mathbf{B}} \\ \cmc{3}{\cf{s\fsb{1}{}} / \cf{np\fb{acc}}} } \end{center} \caption{Unification and subject-verb agreement} \label{subj-v-agr} \end{figure} Speaking of unification, let's examine the role it plays in enforcing subject-verb agreement. 
The category for the definite article is given in Figure~\ref{def-art}. The definite article is compatible with both singular and plural nouns, but it must retain this number information for subject-verb agreement to work. Propagating number information is accomplished here by setting the feature structure id to be same on both the \cf{np} result category and on the argument category \cf{n} (i.e., we have \texttt{id="2"} in both cases). Figure~\ref{subj-v-agr} provides an illustration, showing how \gf{the teacher} ends up as a singular \cf{np}, while \gf{the teachers} ends up as a plural one.\footnote{Note that feature structure id's are only shown when relevant to unification. Also, in \occg\ derivations, the id's are actually mapped to ``fresh'' ones after lexical lookup, to avoid any accidental coindexations across different lexical items.} Type raising the \cf{np} and forward composing it with \gf{buys} requires it to unify with the backwards \cf{np} argument of the verb, and in particular, requires the number feature to be singular. Since this is only the case with \gf{the teacher}, the last step in the derivation of \gf{the teachers *buys} will be blocked by a unification failure. \begin{figure} %\begin{quote} \begin{small} \begin{verbatim} \end{verbatim} \end{small} %\end{quote} \[ \gf{for} ~ \vdash ~ \cf{pp\fb{for,acc,X}} \, /_{\!\!\triangleleft} \, \cf{n\fb{acc,X}} \] \caption{Default unification with case marking prepositions} \label{prep-nom} \end{figure} Coindexing two feature structures ensures that all their features will take on the same values. There are times, however, when we want two feature structures to just mostly take on the same values, except for one or two particular features. To support such cases, \occg\ includes a limited form of default unification, specified by the \textsl{inheritsFrom} attribute of a feature structure element. The \textsl{inheritsFrom} mechanism is implemented by compiling out the default unification of two feature structures into individual feature equations at the time of lexical lookup. This works as follows. First, any features appearing on the target category, but not the result category, are copied over. Then, for every feature that has been observed in the grammar for the result category---except for any features that already appear there---a feature equation is added, i.e.\ the feature is set to the same variable on both the target and result categories. As an example, Figure~\ref{prep-nom} shows the category for ``case marking'' prepositions, i.e.\ those prepositions which are assumed to play a purely syntactic role. The \cf{pp} result category has a \texttt{lex} feature which is instantiated by the stem of the actual lexical item, as specified by the keyword \texttt{"[*DEFAULT*]"}. Its remaining features are ``inherited from'' the feature structure with id 3, i.e.\ the one for the argument \cf{np}, as specified by \texttt{inheritsFrom="3"}. When the category for a case-marking preposition (such as \gf{for} here) is instantiated, a feature equation is established between the \cf{pp} and \cf{np} categories for the \texttt{index} feature (whose purpose will be discussed in the next section); the value of the \texttt{case} feature is also copied over. 
Thus, in the figure, both the \cf{pp} result category and the \cf{np} argument category have an index variable \texttt{X} (and accusative case), while only the result PP has a \texttt{lex} feature, with \texttt{for} as its value.\footnote{Since the case feature is arguably superfluous on the result PP, one could avoid it by just including an explicit feature equation for the \texttt{index} variable. Generally though, it's simpler and less error-prone to use the \textsl{inheritsFrom} mechanism than to manually include all the relevant feature equations.} \subsection{Set args} \begin{figure} \begin{quote} \begin{verbatim} .. .. .. : \end{verbatim} \end{quote} \[ \gf{nanghuhuli (``catches'')} ~ \vdash ~ \cf{s} \{ / \cf{np\fb{nom}}, /\!_{\times} \cf{np\fb{gen}} \} \] \caption{Tagalog transitive verb with set args} \label{tagalog-set-args} \end{figure} To conclude our discussion of specifying syntactic categories, we should mention the availability of set args and dollar variables in \occg. Set args enable us to define categories that allow arguments to appear in any order, as illustrated in Figure~\ref{tagalog-set-args} for the Tagalog verb \gf{nanghuhuli (``catches'')}. In the figure, both the nominative and genitive arguments must appear to the right of the verb, but their relative order is unconstrained. Note that the nominative argument is given the more powerful associative and permutative slash, while the genitive argument is given the permutative-only slash; see \cite{Baldridge:2002}[Ch.\ 7] for discussion, and \cite{bozsahinsteedman03} for further examples. \subsection{Dollar variables} \begin{figure} \begin{quote} \begin{verbatim} .. .. .. \end{verbatim} \end{quote} \[ \gf{and} ~ \vdash ~ \cf{s}\$_{1} \bs_{\star} \cf{s}\$_{1} /\!_{\star} \cf{s}\$_{1} \] \caption{Category with dollar variables for sentential coordination} \label{sent-coord-dollar} \end{figure} Dollar variables range over a stack of arguments, and can be useful in defining categories for conjunctions, type-raised categories for quantifiers, and categories for unary rules (cf.\ \cite{Baldridge:2002}[Ch.\ 8]). Figure~\ref{sent-coord-dollar} shows the category for \gf{and} that allows a range of clausal categories to be coordinated---e.g., transitive verbs, verb phrases, or subject-verb constituents, in right-node raising---as discussed in \cite{White-RLAC:2004}. \section{Logical forms} \label{lfs} \subsection{Hybrid logic dependency semantics} To associate meanings with categories, we need to take care of two things: the structure of the meaning (logical form) itself, and the relation between the category and that meaning. Usually the latter comes down to specifying how the meanings of arguments are to be fit into the logical form. As logical forms we use \emph{hybrid logical terms} that specify semantic dependency structures; for details, see \cite{Kruijff:2001,Baldridge/Kruijff:2002,White/Baldridge:2003,White-RLAC:2004}. (If you're wondering where the $\lambda$'s have gone, see Section~\ref{tko-lambdas}.) We give the logical form of a category using the \textsl{lf} element: \begin{verbatim} : .. \end{verbatim} \noindent The \textsl{lf} element must always appear at the end of a category specification (whether atomic or complex). The simplest logical form is of the form $@_{X} \phi$, with $\phi$ a proposition. We interpret $X$ as the \emph{discourse referent} of the proposition. 
For the proposition itself, we can follow linguistic tradition and use a word's stem to represent its meaning, except that we'll use boldface rather than prime notation (i.e., we'll represent the meaning of \gf{word} as \C{word} rather than $\mathit{word}'$). We achieve exactly this effect using the keyword \texttt{"[*DEFAULT*]"}, as shown below: \begin{verbatim} \end{verbatim} \noindent The \textsl{satop} element introduces a satisfaction operator @, along with a nominal variable, or \textsl{nomvar}, $X$. (In the grammar, we use logic variables rather than concrete instantiations for nominals; during parsing or realization, \occg\ instantiates these variables dynamically.) Nominals can have types (or sorts) associated with them, as will be explained further in Section~\ref{types}; here, $X$ is allowed to be any subtype of semantic object. The \textsl{prop} element specifies the proposition. \begin{figure} \begin{small} \begin{verbatim} [lexicon.xml] [morph.xml] : \end{verbatim} \end{small} \[ \gf{flower} ~ \vdash ~ \cf{n\fsb{2}{sg,X\!:\con{thing}}} ~ : ~ @_{X\!:\con{thing}}(\C{flower} \wedge \modp{num}\con{sg}) \] \caption{Noun with logical form} \label{noun-lf} \end{figure} \subsection{The syntax-semantics interface} To establish the interface between syntactic structure, as defined by the category, and the logical form, we co-index categories with nominals in the logical form, by adding an attribute \texttt{index} to the feature structure of each category and giving that attribute the corresponding nominal as value. To illustrate, Figure~\ref{noun-lf} (top) shows the complete category definition for nouns. Note how the feature structure includes a feature named \texttt{index}, whose value is a logical form just consisting of the nominal variable $X$---that is, a variable with the same name as the one introduced in the satisfaction operator of the LF further down.\footnote{It suffices to put all the semantic type restrictions on the nominals in the LF; i.e., it's not necessary to put them on the \texttt{index} variables as well.} In the middle of Figure~\ref{noun-lf}, the entry for the noun \gf{flower} in \texttt{morph.xml} is shown. This entry includes \texttt{thing} as the semantic class (i.e.\ its semantic type), which is unified with the type of the nominal head $X$ during lexical instantiation. The entry also includes the macros \texttt{@sg} and \texttt{@sg-X}, where the former adds the syntactic feature of singular number, while the latter adds the semantic feature of singular number on the nominal $X$ (as shown below the entry). At the bottom of the figure is the complete category that results from lexical lookup and instantiation of \gf{flower}. Note that it is possible to fill in the semantic head's proposition with something other than the stem. To do so, we can specify a \textsl{pred} to use in place of the stem, when listing a stem as a member of a family: \begin{verbatim} : : : \end{verbatim} \noindent With this specification, the proposition \C{catch} will appear in the logical form for the Tagalog verb \gf{nanghuhuli}: \begin{exe} \ex \label{tg-catch} \( \begin{array}{rcl} \gf{nanghuhuli} & \vdash & \cf{s\fb{E}} \{ / \cf{np\fb{nom,X}}, /\!_{\times} \cf{np\fb{gen,Y}} \} ~ : ~ \\ && @_{E}(\C{catch} \wedge \modp{Actor}X \wedge \modp{Patient}Y) \\ \end{array} \) \end{exe} \begin{figure} \begin{small} \begin{verbatim} .. .. 
\end{verbatim} \end{small} \[ \begin{array}{rcl} \gf{bought} & \vdash & \cf{s\fsb{1}{E:\con{action}}} \bs \cf{np\fsb{2}{nom,X\!:\con{animate\mbox{-}being}}} / \cf{np\fsb{3}{acc,Y\!:\con{sem\mbox{-}obj}}} ~ : \\ && @_{E:\con{action}}(\C{buy} \wedge \modp{tense}\con{past}) \wedge \\ && @_{E:\con{action}}(\modp{Actor}X\!\!:\!\con{animate\mbox{-}being}) \wedge \\ && @_{E:\con{action}}(\modp{Patient}Y\!\!:\!\con{sem\mbox{-}obj}) \\ \end{array} \] \caption{Transitive verb with logical form} \label{tv-lf} \end{figure} \subsection{Dependency relations} To introduce dependency relations---like those we just saw for the Tagalog verb \gf{nanghuhuli}---we use the \textsl{diamond} element. For example, to state that an English transitive verb has a logical form with an \modp{Actor} and a \modp{Patient}, we can specify the category shown in Figure~\ref{tv-lf}. At the bottom of the figure, this category appears instantiated for the verb \gf{bought}. Note that for ease of display, the logical form has been partially flattened, with each dependency relation appearing on a separate line. (In \occg, logical forms are automatically flattened prior to parsing or realization.) \begin{figure} \begin{small} \begin{verbatim} .. \end{verbatim} \end{small} \[ \gf{the} ~ \vdash ~ \cf{np\fsb{2}{3rd,X\!:\con{sem\mbox{-}obj}}}/_{\!\!\diamond}\cf{n\fsb{2}{X\!:\con{sem\mbox{-}obj}}} ~ : ~ @_{X\!:\con{sem\mbox{-}obj}}(\modp{det}\con{the}) \] \caption{Determiner with logical form} \label{det-lf} \end{figure} \subsection{Function words} Finally, Figure~\ref{det-lf} illustrates how we can specify the meaning of function words, i.e.\ words that have no independent meaning. The example gives a specification for determiners, which add a semantic feature $\modp{det}$ to the meaning of the nominal head they modify. The noun itself provides the meaning through co-indexation with $X$, the root nominal of the logical form for the determiner. At the bottom of the figure is the category instantiated for the definite article \gf{the}. To support the realization of function words, the semantic relation or feature introduced by the word must be declared using the \textsl{indexRel} attribute on the \textsl{family} element.\footnote{In principle, it would be possible for \occg\ to figure out when a semantic relation or feature should be used for indexing purposes, but the possibility of adding further semantic content via macros makes it non-trivial to do so.} For example, in Figure~\ref{det-lf} we have \texttt{indexRel="det"}, which indicates that the $\modp{det}$ feature should be used to trigger the lookup of the appropriate determiner. (Normally, semantic relations or features are introduced as part of the meaning of content words.) When function words are semantically null---e.g., with case-marking prepositions in the \texttt{tiny} grammar---the keyword \texttt{*NoSem*} should be given as the value of the \textsl{indexRel} attribute. \subsection{Relation sorting} It is possible to specify the order in which to display relations appearing at the same level in the logical forms. By default, relations are sorted alphabetically, with a few exceptions, e.g.\ that $\modp{Restr}$ should appear before $\modp{Body}$. You can customize the order in which relations appear using the optional \textsl{relation-sorting} element in \texttt{lexicon.xml}. See the \texttt{lexicon.xsd} schema for details. 
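To make the elements introduced above concrete, a schematic \textsl{lf} specification for a transitive verb's semantics might look roughly as follows; the element names are the ones introduced in this section, but the exact attribute names (e.g.\ \texttt{nomvar}, \texttt{name} and \texttt{mode}) should be checked against the schema files and the \texttt{tiny} grammar:
\begin{verbatim}
<lf>
  <satop nomvar="E">
    <prop name="[*DEFAULT*]"/>
    <diamond mode="Actor"><nomvar name="X"/></diamond>
    <diamond mode="Patient"><nomvar name="Y"/></diamond>
  </satop>
</lf>
\end{verbatim}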
\subsection{From CCG to \occg: Taking care of lambdas} \label{tko-lambdas} In CCG, logical forms are normally given using terms from the lambda calculus, e.g. \begin{exe} \ex \label{buy-lambdas} \( \gf{buy} ~ \vdash ~ (\cf{s} \bs \cf{np\fb{nom}}) / \cf{np\fb{acc}} ~ : ~ \lambda x_2 x_1 . \mathrm{buy}^\prime x_2 x_1 \) \end{exe} \begin{exe} \ex \label{tg-catch-lambdas} \( \gf{nanghuhuli} ~ \vdash ~ \cf{s} \{ / \cf{np\fb{nom}}, /\!_{\times} \cf{np\fb{gen}} \} ~ : ~ \lambda \{ x_1, x_2 \} . \mathrm{catch}^\prime x_2 x_1 \) \end{exe} \noindent In (\ref{buy-lambdas}), $x_2$ corresponds to the outermost argument, $/ \cf{np\fb{acc}}$, and $x_1$ to the innermost one, $\bs \cf{np\fb{nom}}$. Example (\ref{tg-catch-lambdas}) uses set-lambda notation with the following convention (cf. \cite{bozsahinsteedman03}): the lambda operator binds a set of variables which are paired with the set of arguments in left-to-right order. Thus, in the second example above, $x_1$ corresponds to $/ \cf{np\fb{nom}}$, and $x_2$ to $/\!_{\times} \cf{np\fb{gen}}$. The interpretation of the CCG $\lambda$-terms above is as in (\ref{pas}), where the argument $x_i$ c-commands $x_{i+j}$ for $j=1,2,\cdots n-i$, at the level of predicate-argument structure (c-command is called LF-command in CCG for that reason). This is how (and where) CCG defines binding constraints. \begin{exe} \ex \label{pas} \begin{minipage}{0.7\textwidth} \includegraphics{pas.pdf} \end{minipage} \end{exe} As we have seen earlier in this section, \occg\ uses hybrid logic dependency semantics (HLDS) terms, rather than $\lambda$-terms, in its logical forms. For example, the HLDS terms for (\ref{buy-lambdas}) and (\ref{tg-catch-lambdas}) appeared in Figure~\ref{tv-lf} and in (\ref{tg-catch}). These terms differ from their $\lambda$-counterparts in a couple of ways. First, in semantic construction, argument binding is accomplished through unification, rather than via function application. And second, predicates are typically connected to their arguments via semantic roles, such as $\modp{Agent}$ and $\modp{Patient}$---though nothing prevents relations such as $\modp{Arg1}$ and $\modp{Arg2}$ from being used instead. Using semantic roles can be more convenient for applications, and makes it possible to capture semantic similarities across argument structure alternations. The downside is that it makes it impossible to enforce binding constraints. In principle, relations encoding semantic roles (e.g.\ $\modp{Agent}$ and $\modp{Patient}$) could be combined with ones for argument structure (e.g.\ $\modp{Arg1} \ldots \modp{ArgN}$) in the same HLDS logical form, though this has not yet been tried. \section{Types} \label{types} Types (aka sorts) allow for some abstraction, generalization and specialization in an \occg\ grammar. Unlike HPSG, \occg\ only employs atomic types. These types may be used as restrictions on syntactic or semantic feature variables, or given as values of syntactic or semantic features. Multiple-inheritance is allowed (see \cite{erkanms03} for further information). Types are kept in the types file, usually named \texttt{types.xml}. This file is optional, which means that features can be untyped (actually, all features will be considered to be of type \texttt{top} in this case, which is the only predefined type). 
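For instance, a types file fragment defining the hierarchy of person values discussed below (cf.\ Figure~\ref{pers-vals}) might look roughly like this, though note that the attribute name used here for the list of parent types (\texttt{parents}) is an assumption and should be checked against the schema files:
\begin{verbatim}
<type name="pers-vals"/>
<type name="non-3rd" parents="pers-vals"/>
  <type name="1st" parents="non-3rd"/>
  <type name="2nd" parents="non-3rd"/>
<type name="3rd" parents="pers-vals"/>
\end{verbatim}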
\begin{figure} \begin{verbatim} \end{verbatim} \caption{Hierarchy of syntactic person values} \label{pers-vals} \end{figure} In Section~\ref{words}, Figure~\ref{pers-macros}, we saw how the value of the person feature \texttt{non-3rd} could be used to define a category compatible with both \texttt{1st} and \texttt{2nd} person singular subjects. This definition relies on the following specification of person values in the \texttt{tiny} grammar's \texttt{types.xml} file, listed in Figure~\ref{pers-vals}. As this example shows, types are defined using a \textsl{type} element and are required to have a \textsl{name}. They may also have a space-separated list of one or more \textsl{parent} types. Indenting may be used to show the primary type-subtype hierarchy:\footnote{Since multiple parents are allowed, nesting of elements is not used to define type-subtype relationships.} here, \texttt{1st} and \texttt{2nd} are subtypes of \texttt{non-3rd}, while \texttt{non-3rd} and \texttt{3rd} are subtypes of \texttt{pers-vals}. If no parent types are listed---as with \texttt{pers-vals}---the type is implicitly a subtype of \texttt{top}. \begin{figure} \begin{verbatim} \end{verbatim} \caption{Hierarchy of semantic types/sorts} \label{ont-sorts} \end{figure} The \occg\ type system does not distinguish between syntactic and semantic types; it is up to the grammar designer to ensure their systematic use. For example, if there is to be a syntactic hierarchy and a semantic hierarchy of types, it is a good idea to define a `top object' for each (or at least for one of them), e.g.\ \texttt{sem-obj} as the root of the semantic type hierarchy, as illustrated in Figure~\ref{ont-sorts}. The types in this figure are the ones assumed by the transitive verb category given in Figure~\ref{tv-lf}. With these types, \occg\ can parse and realize \gf{he bought a flower}, but not \gf{*a flower bought he}, since \gf{flower} has type \texttt{thing}, and \texttt{thing} is not compatible with the type \texttt{animate-being}, as is required for the \modp{Actor} of a \C{buy} action. \section{Rules} \label{rules} The rules file, typically named \texttt{rules.xml}, specifies the combinatory rules for a grammar. The rule specifications for the \texttt{tiny} grammar appear below: \begin{verbatim} \end{verbatim} \noindent In addition to the rules shown here, it is also possible to have substitution rules, as well as additional type raising rules. By default, the argument and result categories for a type raising rule are \cf{np} and \cf{s}, respectively. To create a type raising rule using different categories, you can use an \textsl{arg} and/or \textsl{result} element to specify the desired atomic category. For example, a backward type raising rule for prepositional phrases is included as the last rule above. Theoretically speaking, CCG combinatory rules are universal; \emph{any} lexicalized grammar has access to them if it uses in the lexical categories the modalities licensed by the rules (see \cite{Steedman/Baldridge:2003} for further information). The rules file can also incorporate rules that are language specific. To illustrate, let's consider the case of pro drop in Turkish. 
Turkish is a pro-drop language, which means that subjects of finite clauses can be dropped because morphology of the finite verb already indicates the subject: \begin{itemize} \item[(a)] \begin{tabular}{ll} Ben & uyu-du-m/*-n \\ I & sleep-PAST-1SG/*-2SG \\ \multicolumn{2}{l}{`I slept.'} \\ \end{tabular} \item[(b)] \begin{tabular}{l} Uyu-du-m \\ sleep-PAST-1SG \\ `(I) slept.' \\ \end{tabular} \end{itemize} Pro drop can be modelled in different ways. For example, one can write a lexical rule to generate the derived lexical entries of finite verbs \emph{in} the lexicon, so that every finite verb has two lexical entries, one derived from the other---e.g.\ (\ref{ex:prodrop}) below, which asserts $\cf{s\fb{fin}}\bs\cf{np\fb{acc}}$ and $\cf{s\fb{fin}}$ entries in the lexicon from $\cf{s\fb{fin}}\bs\cf{np\fb{nom}}\bs\cf{np\fb{acc}}$ and $\cf{s\fb{fin}}\bs\cf{np\fb{nom}}$, etc. \begin{equation} \label{ex:prodrop} \cf{s\fb{fin}}\bs\cf{np\fb{nom}}\$_1 \Rightarrow \cf{s\fb{fin}}\$_1 \end{equation} This strategy has theoretical and practical implications. Theoretically, it assumes that \emph{all} morphology is confined to the lexicon, including inflectional morphology, which is usually regarded as part of syntax (see e.g.\ \cite{bozsahin02cl} for its implications for the transparency of syntax-semantics correspondence). \occg\ does not assume that there are only words in the lexicon; anything that can bear a category (words, affixes, clitics) can be a lexical item.\footnote{Currently, \occg\ does not have any mechanism to enforce the \emph{Lexical Integrity Principle} of \cite{bresnanmchombo95}, which basically states that words are islands as far as syntax is concerned, e.g.\ it is not possible to extract out of a word. \cite{bozsahin02cl} proposes that different attachment characteristics of words and bound morphemes can be factored into CCG's lexical entries and combinatory rules (the latter simply projects them onto surface grammar), in effect rendering LIP as a phonological principle, but this is an open problem for now.} On the practical side, it assumes that all inflected forms of the verb are listed in the lexicon. For morphologically rich languages such as Turkish, this amounts to around 2$^{8}$ entries per verb because Turkish has 8 inflections in the verb paradigm, all of which are optional. \begin{figure} \begin{verbatim} \end{verbatim} \caption{Unary rule for pro drop} \label{pro-drop-rule} \end{figure} An alternative is to add a unary rule for pro drop to \texttt{rules.xml}. This rule will apply ``on the fly'', that is, it can apply to lexical or combinatorially-derived inflected verb forms. The rule, which implements (\ref{ex:prodrop}), may be specified as shown in Figure~\ref{pro-drop-rule} (we omit the \$ variable for simplicity). Unary rules are defined using a \textsl{typechanging} element, since such rules must change the type of the argument category---otherwise, nothing would prevent the rule from applying again and again to its own output. \section{Trying it out} Once you've configured and built \occg\, per the \texttt{README} file, you're ready to try out the grammar testing tools. You can experiment with the grammars described in \texttt{SAMPLE\_GRAMMARS} or make one of your own. In the latter case, it will be easier if you create your grammar in its own subdirectory of the \texttt{grammars} directory. There are (at present) three command line tools for trying grammars out: \texttt{tccg}, \texttt{ccg-test} and \texttt{ccg-realize}. 
\subsection{\texttt{tccg}}

The \texttt{tccg} tool (for ``text CCG'') is for interactively testing a grammar. Its (primary) usage is
\begin{verbatim}
tccg (<grammar file>)
\end{verbatim}
\noindent The default grammar file name is \texttt{grammar.xml}. You can try it out by going to the \texttt{grammars/tiny} directory and running \texttt{tccg}, like so:\footnote{Examples like this one may have an occasional extra line break to improve readability.}
\begin{small}
\begin{verbatim}
D:\Mike\dev\openccg\grammars\tiny>tccg
Loading grammar from URL: file:/D:/Mike/dev/openccg/grammars
  /tiny/grammar.xml
Grammar 'tiny' loaded.

Enter strings to parse.
Type ':r' to realize selected reading of previous parse.
Type ':h' for help on display options and ':q' to quit.
You can use the tab key for command completion,
Ctrl-P (prev) and Ctrl-N (next) to access the command history,
and emacs-style control keys to edit the line.

tccg>
\end{verbatim}
\end{small}
Typing in \texttt{:h} shows all the available commands. For example, \texttt{:derivs} turns on the display of derivations when you parse an expression:
\begin{small}
\begin{verbatim}
tccg> :derivs
tccg> the teacher buys
3 parses found.

Parse 1: s/np
------------------------------
(lex)  the :- np/^n
(lex)  teacher :- n
(>)    the teacher :- np
(>T)   the teacher :- s/@i(s\@inp)
(lex)  buys :- s\np/np
(>B)   the teacher buys :- s/np

tccg>
\end{verbatim}
\end{small}
\noindent Here we see a (simplified) vertical display of the derivation seen earlier in Figure~\ref{subj-v-agr}. (If you have \LaTeX\ installed, it's also possible to see derivations like those in Figure~\ref{subj-v-agr} using the \texttt{:vison} command, but note that its current behavior is a bit flaky.) Only the first parse is shown; the other two parses, for the ditransitive and \cf{np} \cf{pp\fb{for}} categories of the verb, can be seen by turning on all derivations with the \texttt{:all} command. To see the features on the categories, you can use the \texttt{:feats} command, optionally with a subset of features to show. Logical forms can be shown with the \texttt{:sem} command:
\begin{small}
\begin{verbatim}
tccg> :noderivs
tccg> :sem
tccg> she bought the policeman a flower
1 parse found.

Parse: s :
  @b1:action(buy ^ past ^
             (p1:animate-being ^ pro3f ^ sg) ^
             (p2:person ^ policeman ^ the ^ sg) ^
             (f1:thing ^ flower ^ a ^ sg))

tccg>
\end{verbatim}
\end{small}
To see the realizations for this logical form (i.e., the one from the previous parse), use the \texttt{:r} command:
\begin{small}
\begin{verbatim}
tccg> :nosem
tccg> :r
[1.000] she bought the policeman a flower :- s
[0.167] she bought a flower for the policeman :- s

tccg>
\end{verbatim}
\end{small}
\noindent Realizations are ordered by their n-gram similarity to the previously entered expression. You can have a look in the \texttt{morph.xml} file for more words to form expressions with. Note that the settings of the various options available in \texttt{tccg} persist between sessions; use \texttt{:reset} to undo all these settings and return to the default ones.

\subsection{\texttt{ccg-test}}

The \texttt{ccg-test} tool is for regression testing, and also provides options for timing the realizer. Its (primary) usage is
\begin{verbatim}
ccg-test (-noparsing|-norealization) (-g <grammar file>) (<regression file>)
\end{verbatim}
By default, \texttt{ccg-test} will use the grammar in the current directory and the default regression file, \texttt{testbed.xml}.
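As a rough illustration of what a regression file contains, each entry pairs a test string with its expected number of parses; the element and attribute names below are hypothetical (check the \texttt{testbed.xml} files in the sample grammars for the exact format):
\begin{verbatim}
<regression>
  <item numOfParses="1" string="she bought the policeman a flower"/>
  <item numOfParses="0" string="a flower bought he"/>
</regression>
\end{verbatim}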
Note that you can set realizer options, such as its time limit, in \texttt{tccg}, e.g.\ by issuing the command \texttt{:tl 1000} (for time limit 1000 ms.), and this value will persist and be used by \texttt{ccg-test}.

\subsection{\texttt{ccg-realize}}

The \texttt{ccg-realize} tool provides a sample interface to the realizer (see the underlying \texttt{opennlp/ccg/Realize.java} file), and can be an aid in debugging realization. It loads a grammar, runs the realizer on an input XML file, and logs its processing to an output text file (or to system out). Its usage is
\begin{verbatim}
ccg-realize (-g <grammar file>) <input file> (<output file>)
\end{verbatim}
You can create input files for \texttt{ccg-realize} using the \texttt{:2xml} option in \texttt{tccg}.

\section{Building grammars}

\occg\ comes with various utilities to help you build the files used by the runtime system---and to validate their contents---rather than writing them entirely by hand. The utilities take advantage of the \texttt{ccg-build} front end to the Apache Ant (\url{http://ant.apache.org}) build tool. In principle, \texttt{ccg-build} allows you to organize your files in any way you like to produce the runtime grammar files.

\subsection{Validating the grammar files}

You can use \texttt{ccg-build} to validate the grammar files against their XML schemas. To do so, you need to have a \texttt{build.xml} file in your grammar directory, which contains build tasks for the Apache Ant tool to carry out. The \texttt{tiny} grammar directory contains a build file which just validates the runtime files, as shown below:
\begin{small}
\begin{verbatim}
D:\Mike\dev\openccg\grammars\tiny>ccg-build
Buildfile: build.xml

init:
     [echo] ----------- OpenCCG ------------

grammar:
     [echo] Validating grammar.xml, lexicon.xml, morph.xml,
            rules.xml and types.xml

BUILD SUCCESSFUL
Total time: 4 seconds
\end{verbatim}
\end{small}
\noindent If there are any errors, validation with \texttt{ccg-build} gives relatively informative error messages. Loading a grammar into \texttt{tccg} will perform some further checks, but note that loading a grammar with errors usually means \texttt{tccg} croaks---outputting only (less informative) stack traces---so it's good practice to validate any changes you make to your grammars prior to running \texttt{tccg}.

\subsection{Using a \texttt{dict.xml} file}

Rather than creating a \texttt{morph.xml} file directly, you can employ a \texttt{dict.xml} file, which groups word forms by their stems and parts of speech, and lists the closed families for a given stem. A \texttt{dict.xml} file usually works together with a file called \texttt{lexicon-base.xml}, which does not contain \textsl{member} entries for families. From the \texttt{dict.xml} file---which also contains macro definitions---the \texttt{morph.xml} file can be generated automatically, with proper hooks to a derived \texttt{lexicon.xml} file, using \texttt{ccg-build}. (See the \texttt{dict.xsd} schema in the \texttt{grammars} directory for a complete description.) In short, the simplest way to use a \texttt{dict.xml} file with \texttt{ccg-build} is to prepare a family of categories in the file named \texttt{lexicon-base.xml} without \textsl{member} entries, and to group stems and their word forms in a file called \texttt{dict.xml}, along with macro definitions. A sample entry from the \texttt{cem-english} \texttt{dict.xml} file appears below:
\begin{verbatim}
\end{verbatim}
\noindent Note that the stem \gf{eat} is declared intransitive and transitive without duplication in the morph or lexicon files.
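To give a feel for the idea, a \texttt{dict.xml} entry for \gf{eat} might group its word forms and list its two families along the following lines; the element and attribute names here are hypothetical, so consult \texttt{dict.xsd} and the \texttt{cem-english} grammar for the actual schema:
\begin{verbatim}
<entry stem="eat" pos="V">
  <member-of family="iv"/>
  <member-of family="tv"/>
  <word form="eat"/>
  <word form="eats" macros="@sg @3rd"/>
  <word form="ate" macros="@past"/>
</entry>
\end{verbatim}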
If you run \texttt{ccg-build} as follows,
\begin{verbatim}
cem-english> ccg-build grammar
Buildfile: build.xml

init:
     [echo] ----------- OpenCCG ------------

grammar:
     [echo] Adding family members from dict.xml to lexicon-base.xml,
            yielding lexicon.xml
     [echo] Extracting morph items from dict.xml to morph.xml
     [echo] Validating grammar.xml, lexicon.xml, morph.xml,
            rules.xml and types.xml

BUILD SUCCESSFUL
Total time: 5 seconds
\end{verbatim}
\noindent there will be two lexical assignments for every word form of \gf{eat}, one for its intransitive use, and one for transitive.

\subsection{Reducing redundancy with XSLT}

\href{http://www.w3.org/Style/XSL/}{XSLT} is a language for transforming XML documents. Two XSLT transformations, \texttt{add-family-members.xsl} and \texttt{extract-morph.xsl}, are used by \texttt{ccg-build} to handle \texttt{dict.xml} files. You can also use XSLT transformations to reduce redundancy in the lexico-grammar specifications. For example, the \texttt{worldcup} grammar illustrates a couple of ways of using XSLT to improve the specification of lexical families. With this grammar, the \texttt{lexicon-base.xml} file is generated from an XSLT transformation, called \texttt{lexicon-base.xsl}. This file begins with the definition of variables for the various atomic categories used in later complex category and family definitions. The variable names follow the format
\begin{verbatim}
<label>(.<id>)?(.from-<inheritsFrom id>)?(.<index var>?)(.<feat>)*
\end{verbatim}
\noindent i.e., the category label, followed optionally by the \texttt{id}, the \texttt{inheritsFrom} id, the \texttt{index} variable, and any further feature descriptions. This convention allows one to see what atomic categories are already in use, and to determine the contents of an atomic category at a glance. For example, \texttt{np.3.Y.acc} is the name of the category with label \texttt{np}, id \texttt{3}, index \texttt{Y}, and the case value \texttt{acc}; \texttt{np.2.X.default} is similar, but has default variables for all features other than the \texttt{index}. Once variables have been declared, they can be referenced further on using \texttt{xsl:copy-of} statements. For example, the variable \texttt{np.2.X.default} is referenced seven times in \texttt{lexicon-base.xsl}. In this way, if a change to \texttt{np.2.X.default} is desired, it can be made in one place in the file, rather than seven. Another XSLT mechanism employed in \texttt{lexicon-base.xsl} is a named template called \texttt{extend}, which serves to append one element as the last child of another. This mechanism is used to associate logical forms with syntactic categories, as well as to create new categories from existing ones. For example, in
\begin{small}
\begin{verbatim}
\end{verbatim}
\end{small}
\noindent the category for a subject type-raised \emph{wh}-determiner, like \gf{which}, is created by extending the category of a subject type-raised \emph{wh}--noun phrase (e.g.\ \gf{who}) with an extra nominal argument, \texttt{fslash-n.2.X} (declared earlier as a forward slash plus a category with label \texttt{n}, id \texttt{2} and index \texttt{X}).\footnote{The \texttt{xalan:nodeset} function makes it possible to use a variable as a parameter to a named template; its use won't be necessary in future versions of XSLT.} In this way, any changes made to the category for \emph{wh}--noun phrases will carry over to the category for \emph{wh}-determiners.
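To sketch how the variable-and-copy mechanism works, a fragment along the following lines declares a category once under its conventional name and then reuses it by reference; the feature structure inside the variable is abbreviated and purely illustrative, while \texttt{xsl:variable} and \texttt{xsl:copy-of} themselves are standard XSLT:
\begin{small}
\begin{verbatim}
<!-- declare the category once, under its conventional name -->
<xsl:variable name="np.2.X.default">
  <atomcat type="np">
    <fs id="2">
      <feat attr="index"><lf><nomvar name="X"/></lf></feat>
    </fs>
  </atomcat>
</xsl:variable>

<!-- ... and reuse it wherever the category is needed -->
<xsl:copy-of select="$np.2.X.default"/>
\end{verbatim}
\end{small}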
As XSLT is a powerful and extensible XML transformation language, there are many further possibilities for using it in grammar development---limited only by your imagination (and hacking ability). %% NB: Could eventually add lexical rule example. %% NB: Should add discussion of chunking rules. %% NB: Should add discussion of \textsl{licensing-features} %% ===================================================================== %% BIBLIOGRAPHY %% ===================================================================== \addcontentsline{toc}{section}{References} \bibliographystyle{alpha} \bibliography{openccg} \end{document} ================================================ FILE: docs/guide/openccg.bib ================================================ @string{nllt="Natural Language and Linguistic Theory"} @phdthesis{Baldridge:2002, author = {Baldridge, Jason}, title = {Lexically Specified Derivational Control in {C}ombinatory {C}ategorial {G}rammar}, school = {School of Informatics, University of Edinburgh}, year = {2002}, note={Available from \url{http://homepages.inf.ed.ac.uk/jbaldrid/dissertation/}} } % address = {Edinburgh, Scotland}, @inproceedings{Baldridge/Kruijff:2002, author={Baldridge, Jason and Kruijff, Geert-Jan M.}, title={Coupling {CCG} and Hybrid Logic Dependency Semantics}, booktitle={Proceedings of the 40th Annual Meeting of the Association for Computational Linguistics (ACL 2002)}, year = {2002}, address = {Philadelphia, Pennsylvania} } @inproceedings{Baldridge/Kruijff:2003, author={Baldridge, Jason and Kruijff, Geert-Jan M.}, title={Multi-Modal Combinatory Categorial Grammar}, booktitle={Proceedings of the 10th Conference of the European Chapter of the Association for Computational Linguistics (EACL 2003)}, year = {2003}, address = {Budapest, Hungary}} } @phdthesis{Kruijff:2001, author={Kruijff, Geert-Jan M.}, title={A Categorial-Modal Logical Architecture of Informativity: Dependency Grammar Logic \& Information Structure}, school={Faculty of Mathematics and Physics, Charles University}, address={Prague, Czech Republic}, year={2001}} @book{Steedman:SynProc, author = {Mark Steedman}, title = {The Syntactic Process}, publisher = {The MIT Press}, address="Cambridge Mass.", year = {2000}, } @inproceedings{White/Baldridge:2003, author = {White, Michael and Baldridge, Jason}, title = {Adapting Chart Realization to {CCG}}, booktitle = {Proceedings of the Ninth European Workshop on Natural Language Generation}, year = {2003}, address = {Budapest, Hungary}} } @Article{White-RLAC:2004, author = {Michael White}, year = 2004, title = "{Efficient Realization of Coordinate Structures in Combinatory Categorial Grammar}", journal = {Research on Language and Computation}, note = {To appear} } @InProceedings{White-INLG:2004, author = {Michael White}, year = 2004, title = "{Reining in CCG Chart Realization}", booktitle = {Proceedings of the Third International Conference on Natural Language Generation, INLG-04} } @InProceedings{White-ACLSoft:2005, author = {Michael White}, year = 2005, title = "Designing an Extensible {API} for Integrating Language Modeling and Realization", booktitle = {Proc.\ ACL-05 Workshop on Software} } @mastersthesis{erkanms03, author = {G{\"u}ne{\c{s}} Erkan}, title = {A Type System for {CCG}}, school = {Middle East Technical University, Ankara}, note={Available from \url{http://www.LcsL.metu.edu.tr/ftp/theses/erkan-ms-03.pdf.gz}}, year = {2003}, } @unpublished{bozsahinsteedman03, author="Cem Bozsahin and Mark Steedman", title="Lexicalized Asymmetry and Syntactic Projection", 
year="2005", note="{Manuscript}, University of {E}dinburgh" } @unpublished{Steedman/Baldridge:2003, author = {Mark Steedman and Jason Baldridge}, title = {Combinatory {C}ategorial {G}rammar}, note = {Tutorial paper, available from \url{http://homepages.inf.ed.ac.uk/jbaldrid/ccg.pdf}}, year = {2003}, } @article{bozsahin02cl, author="Cem Bozsahin", title= "The Combinatory Morphemic Lexicon", journal= "Computational Linguistics", volume=28, number=2, pages="145--176", year="2002" } @article{bresnanmchombo95, author="Joan Bresnan and Sam A. Mchombo", title= "The {L}exical {I}ntegrity {P}rinciple: Evidence from {B}antu", journal= nllt, volume="13", pages="181--254", year="1995" } ================================================ FILE: docs/guide/openccg.sty ================================================ %% %% This style file contains a minimal set of commands for %% OpenCCG categories and logical forms, plus derivations. %% It borrows from earlier style files by Gann, Jason and Geert-Jan, %% and from Beryl and Mark for the derivations. %% \newcommand{\bs}{\backslash} % backslash, to save typing \newcommand{\gf}[1]{\textsf{\textsl{#1}}} % gloss font, for words \newcommand{\cf}[1]{\ensuremath{\mathsf{#1}}} % category font \newcommand{\fb}[1]{\ensuremath{_{\mathit{#1}}}} % features, subscripted \newcommand{\fsb}[2]{\ensuremath{_{\langle#1\rangle\mathit{#2}}}} % fs index and features, subscripted \newcommand{\C}[1]{\textbf{#1}} % concept font \newcommand{\con}[1]{\ensuremath{\mathrm{#1}}} % constant font, for sem feature values or sem sorts \newcommand{\modp}[1]{\ensuremath{\langle}\textsc{#1}\ensuremath{\rangle}} % sem relation/feature % CCG derivations % arguments: #1 = no. of words, #2 = body % Carsten suggests removing @{}, in order to eliminate a gap on the % left end of lines in the derivation \newcommand{\deriv}[2] { \renewcommand{\arraystretch}{.5} $\begin{array}[t]{*{#1}{c}} #2 \end{array}$ } % centered multicolumn (NB: changed \mc to \cmc to avoid conflict with kluwer.cls) \newcommand{\cmc}[2]{\multicolumn{#1}{c}{#2}} % Rules, argument #1 gives the number of columns to cover. 
\newcommand{\uline}[1] {\cmc{#1}{\hrulefill} } \newcommand{\fapply}[1] { \cmc{#1}{\hrulefill_{>}} } \newcommand{\bapply}[1] { \cmc{#1}{\hrulefill_{<}} } \newcommand{\fcomp}[1] { \cmc{#1}{\hrulefill_{{>}\mathbf{B}}}} \newcommand{\fxcomp}[1] { \cmc{#1}{\hrulefill_{{>}\mathbf{B}_{\times}}}} \newcommand{\fxcompN}[2] { \cmc{#1}{\hrulefill_{{>}\mathbf{B}^{#2}_{\times}}}} \newcommand{\fcomptwo}[1] { \cmc{#1}{\hrulefill_{{>}\mathbf{B}^2}}} \newcommand{\fxcomptwo}[1] { \cmc{#1}{\hrulefill_{{>}\mathbf{B}_{\times}^2}}} \newcommand{\fcompthree}[1] { \cmc{#1}{\hrulefill_{{>}\mathbf{B}^3}}} \newcommand{\fxcompthree}[1] { \cmc{#1}{\hrulefill_{{>}\mathbf{B}_{\times}^3}}} \newcommand{\bcomp}[1] { \cmc{#1}{\hrulefill_{{<}\mathbf{B}}}} \newcommand{\bxcomp}[1] { \cmc{#1}{\hrulefill_{{<}\mathbf{B}_{\times}}}} \newcommand{\bxcompN}[2] { \cmc{#1}{\hrulefill_{{<}\mathbf{B}^{#2}_{\times}}}} \newcommand{\bcomptwo}[1] { \cmc{#1}{\hrulefill_{{<}\mathbf{B}^2}}} \newcommand{\bxcomptwo}[1] { \cmc{#1}{\hrulefill_{{<}\mathbf{B}_{\times}^2}}} \newcommand{\bcompthree}[1] { \cmc{#1}{\hrulefill_{{<}\mathbf{B}^3}}} \newcommand{\bxcompthree}[1] { \cmc{#1}{\hrulefill_{{<}\mathbf{B}_{\times}^3}}} \newcommand{\fsubst}[1] { \cmc{#1}{\hrulefill_{{>}\mathbf{S}}}} \newcommand{\bsubst}[1] { \cmc{#1}{\hrulefill_{{<}\mathbf{S}}}} \newcommand{\fxsubst}[1] { \cmc{#1}{\hrulefill_{{>}\mathbf{S}_{\times}}}} \newcommand{\bxsubst}[1] { \cmc{#1}{\hrulefill_{{<}\mathbf{S}_{\times}}}} \newcommand{\ftype}[1] { \cmc{#1}{\hrulefill_{{>}\mathbf{T}}}} \newcommand{\btype}[1] { \cmc{#1}{\hrulefill_{{<}\mathbf{T}}}} \newcommand{\conj}[1] { \cmc{#1}{\hrulefill_{{<}\Phi{>}}}} \newcommand{\boundary}[1] { \cmc{#1}{\hrulefill_{{<}\mathbf{\%}}}} \newcommand{\asterisk}[1] { \cmc{#1}{\hrulefill_{\mathbf{*}}}} \newcommand{\comb}[2] % an arbitrary combinator { \cmc{#1}{\hrulefill_{#2}}} \newcommand{\badcomb}[2] % an inappropriate use of a combinator { \cmc{#1}{\hrulefill_{\mbox{ *** }}\hrulefill_{#2}}} \newcommand{\dcomp}[2] % an arbitrary dcomposition { \cmc{#1}{\dotfill_{#2}}} \newcommand{\unfreeze}[1] {\cmc{#1}{\hrulefill_{\mathbf{@}}} } \newcommand{\ul}{\uline{1}} \newcounter{CCG@counter} \newcommand{\CCG@amp}{&} \newcommand{\ulines}[1]{ \uline{1} \setcounter{CCG@counter}{1} \whiledo{\value{CCG@counter} < #1} { \CCG@amp \uline{1} \stepcounter{CCG@counter} } } ================================================ FILE: docs/index.html ================================================ The OpenCCG Homepage

OpenCCG: The OpenNLP CCG Library


 
 

OpenCCG, the OpenNLP CCG Library, is an open source natural language processing library written in Java, which provides parsing and realization services based on Mark Steedman's Combinatory Categorial Grammar (CCG) formalism.

The library makes use of multi-modal extensions to CCG developed by Jason Baldridge as part of the Grok system (the precursor to OpenCCG). These extensions are described in Jason's dissertation and in a joint EACL-03 paper with Geert-Jan Kruijff.

Subsequent development efforts, led by Michael White, have focused on making the realizer practical to use in dialogue systems, and more recently, on realization with broad coverage grammars. See the papers on Mike's web page for details. Since version 0.9.4, OpenCCG has included broad coverage English parsing and realization support that together make it possible to experiment with open domain grammatical paraphrasing. Version 0.9.5 adds features for dependency ordering and dependency length minimization in realization, as in White and Rajkumar (2012), along with support for using 5-gram gigaword language models with KenLM, and creating disjunctive logical forms based on the differences between aligned semantic graphs, as in Martin and White (2011). It also includes ccg2jsgf, an extension developed for Knexus Research Corporation for compiling an OpenCCG grammar into a context-free grammar in the Java Speech Grammar Format used by the Sphinx speech recognizer, now released open source. (new!)

Also, Jason Baldridge and students at UT Austin have developed DotCCG, a new format for specifying OpenCCG grammars, and VisCCG, an editor and visualizer for grammars written in DotCCG format. These developments are described in Baldridge, Chatterjee, Palmer and Wing (2007). See the UT Austin computational linguistics lab's OpenCCG wiki, which has a number of tutorials and example grammars for DotCCG and VisCCG.

OpenCCG has been and is being used for a number of dialog systems: see the list of projects using OpenCCG. Please get in touch with Jason if you would like to add yours.

For the latest news about OpenCCG, check out the SourceForge project page.

Further development of OpenCCG has moved to GitHub, where you can get the very latest code on branch master; releases and binaries will continue to be posted on SourceForge.


Email: mwhite at (no spam please) ling dot osu dot edu
2015 March 16


 
================================================ FILE: docs/maxent.cpp.patch ================================================ --- /home/dnm/maxent/maxent-20061005/src/maxent.cpp 2009-05-08 23:57:52.000000000 -0400 +++ /home/dnm/maxentfixes/maxentpatched.cpp 2009-05-08 23:57:47.000000000 -0400 @@ -154,6 +154,9 @@ const char* q = it->second; while (p < q && *p != ':') ++p; + // fixes the case where ':' is in the feature string (D.N. Mehay) + if((p+1) < q && *++p != ':') + --p; if (p == q) return false; context.push_back(make_pair(string(it->first, p - it->first), ================================================ FILE: docs/realizer/build.xml ================================================ ================================================ FILE: docs/realizer/cgloss4e.sty ================================================ % -*- LaTeX -*- % Following borrows from Covington's style files inspired by Midnight by M. % de Groot, adapted to be used with gb4e.sty: examples beginning with \ex can % contain glosses directly. Default is % Linguistic Inquiry style with all lines in \rm; to change a line (eg. to % \it for a particular journal, change the appropriate line: e.g., % \let\eachwordone=\rm in a copy of this file. Note that it will NOT work % to put \it before the line as the words are parsed separately. % Use \singlegloss to force single-spaced glosses even in double-space % environments. Works also in footnotes (^M as delimiter replaced by % \\)---hpk % %%% %%% Sentences with word-by-word glosses %%% % See covingtn.tex for full documentation. Some examples: % % Displayed sentence with gloss and translation: % % \gll Dit is een Nederlands voorbeeld.\\ % This is a Dutch example.\\ % \glt `This is an example in Dutch.' % % Same, using bracketing where words do not correspond one-to-one: % % \gll Dit is een voorbeeldje in het Nederlands.\\ % This is a {little example} in {} Dutch.\\ % \glt `This is a little example in Dutch.' % % If you want to align 3 lines rather than two, use \glll instead of \gll. % % Layout is critical between \gll (or \glll) and \glt (or \gln). % % Thanks to Marcel R. van der Goot for permission to reproduce code. \let\@gsingle=1 \def\singlegloss{\let\@gsingle=1} \def\nosinglegloss{\let\@gsingle=0} \@ifundefined{new@fontshape}% {\def\@selfnt{\ifx\@currsize\normalsize\@normalsize\else\@currsize\fi}} {\def\@selfnt{\selectfont}} \def\gll% % Introduces 2-line text-and-gloss. {\begin{flushleft} \ifx\@gsingle1% conditionally force single spacing (hpk/MC) \vskip\baselineskip\def\baselinestretch{1}% \@selfnt\vskip-\baselineskip\fi% \bgroup \twosent } \def\glll% % Introduces 3-line text-and-gloss. {\begin{flushleft} \ifx\@gsingle1% conditionally force single spacing (hpk/MC) \vskip\baselineskip\def\baselinestretch{1}% \@selfnt\vskip-\baselineskip\fi% \bgroup \threesent } \def\glt{\vskip.17\baselineskip} % Introduces a translation \let\trans\glt \def\glend{} % obsolete % Ends the gloss environment. % The following TeX code is adapted, with permission, from: % gloss.tex: Macros for vertically aligning words in consecutive sentences. % Version: 1.0 release: 26 November 1990 % Copyright (c) 1991 Marcel R. van der Goot (marcel@cs.caltech.edu). % Original Midnight/gloss.tex and Midnight/gloss.doc are available from % csvax.cs.caltech.edu [131.215.131.131] in pub/tex % and many other anonymous ftp archives. 
\newbox\lineone% boxes with words from first line \newbox\linetwo% \newbox\linethree% \newbox\wordone% a word from the first line (hbox) \newbox\wordtwo% \newbox\wordthree% \newbox\gline% the constructed double line (hbox) \newskip\glossglue% extra glue between glossed pairs or triples \glossglue = 0pt plus 2pt minus 1pt % allow stretch/shrink between words %\glossglue = 5pt plus 2pt minus 1pt % allow stretch/shrink between words \newif\ifnotdone \@ifundefined{eachwordone}{\let\eachwordone=\rm}{\relax} \@ifundefined{eachwordtwo}{\let\eachwordtwo=\rm}{\relax} \@ifundefined{eachwordthree}{\let\eachwordthree=\rm}{\relax} \def\lastword#1#2#3% #1 = \each, #2 = line box, #3 = word box {\setbox#2=\vbox{\unvbox#2% \global\setbox#3=\lastbox% }% \ifvoid#3\global\setbox#3=\hbox{#1\strut{} }\fi % extra space following \strut in case #1 needs a space } \def\testdone {\ifdim\ht\lineone=0pt \ifdim\ht\linetwo=0pt \notdonefalse % tricky space after pt \else\notdonetrue \fi \else\notdonetrue \fi } \gdef\getwords(#1,#2)#3 #4\\% #1=linebox, #2=\each, #3=1st word, #4=remainder {\setbox#1=\vbox{\hbox{#2\strut#3 }% adds space \unvbox#1% }% \def\more{#4}% \ifx\more\empty\let\more=\donewords \else\let\more=\getwords \fi \more(#1,#2)#4\\% } \gdef\donewords(#1,#2)\\{}% \gdef\twosent#1\\ #2\\{% #1 = first line, #2 = second line \getwords(\lineone,\eachwordone)#1 \\% \getwords(\linetwo,\eachwordtwo)#2 \\% \loop\lastword{\eachwordone}{\lineone}{\wordone}% \lastword{\eachwordtwo}{\linetwo}{\wordtwo}% \global\setbox\gline=\hbox{\unhbox\gline \hskip\glossglue \vtop{\box\wordone % vtop was vbox \nointerlineskip \box\wordtwo }% }% \testdone \ifnotdone \repeat \egroup % matches \bgroup in \gloss \gl@stop} \gdef\threesent#1\\ #2\\ #3\\{% #1 = first line, #2 = second line, #3 = third \getwords(\lineone,\eachwordone)#1 \\% \getwords(\linetwo,\eachwordtwo)#2 \\% \getwords(\linethree,\eachwordthree)#3 \\% \loop\lastword{\eachwordone}{\lineone}{\wordone}% \lastword{\eachwordtwo}{\linetwo}{\wordtwo}% \lastword{\eachwordthree}{\linethree}{\wordthree}% \global\setbox\gline=\hbox{\unhbox\gline \hskip\glossglue \vtop{\box\wordone % vtop was vbox \nointerlineskip \box\wordtwo \nointerlineskip \box\wordthree }% }% \testdone \ifnotdone \repeat \egroup % matches \bgroup in \gloss \gl@stop} \def\gl@stop{{\hskip -\glossglue}\unhbox\gline\end{flushleft}} \endinput ================================================ FILE: docs/realizer/gb4e.sty ================================================ % -*- LaTeX -*- \def\gbVersion{4e} %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% % Version 4export (= v. 4 minus the compatibility code) % Based on hpk's gb.sty, revised for GM syllabus by ct, % and incorporating macros adapted from J.Frampton, M. de Groot en M. % Covington. Full documentation soon to come in gb4doc.tex. Bug-reports % and suggestions for improvements, other used features, please! % % Notes: % % Various styles for X-bar levels; can be changed, but note that {picture} % environements (e.g. trees) will then come out wrong and have to be % fixed % % This file allows _ and ^ to be used in ordinary text, hence must be % loaded AFTER any file that uses them in their TeX meaning. Hence % cgloss(n).sty is loaded early in this file. %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% %%%%%%%%%%%%%%%%%%%%%%%% % Format of examples: % %%%%%%%%%%%%%%%%%%%%%%%% % \begin{exe} or \exbegin % (arab.) % \begin{xlist} or \xlist % (1st embedding, alph.) % \begin{xlisti} or \xlisti % (2st embedding, rom.) 
% \end{xlisti} or \endxlisti % % \end{xlist} or \endxlist % % \end{exe} or \exend % % Other sublist-styles: xlistA (Alph.), xlistI (Rom.), xlistn (arab) % % \ex (produces Number) % \ex (numbered example) % \ex[jdgmt]{sentence} (numbered example with judgement) % % \exi{ident} (produces identifier) % \exi{ident} (example numbered with identifier) % \exi{ident}[jdgmt]{sentence} (dito with judgement) % (\exr, \exp and \sn are defined in terms of \exi) % % \exr{label} (produces cross-referenced Num.) % \exr{label} (cross-referenced example) % \exr{label}[jdgmt]{sentence} (cross-referenced example with judgement) % % \exp{label} (same as % \exp{label} \exr but % \exp{label}[jdgmt]{sentence} with prime) % % \sn (unnumbered example) % \sn[jdgmt]{sentence} (unnumbered example with judgement) % %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% \@ifundefined{new@fontshape}{\def\reset@font{}\let\mathrm\rm}{} \let\prmbrs=0 \def\primebars{\let\prmbrs=1} \def\obar#1{\ifmmode#1^{0}\else#1$^{0}$\fi} %% FIX \def\mbar#1{\ifmmode#1^{\mathrm{max}}\else#1$^{\mathrm{max}}$\fi} \def\ibar#1{\ifx\prmbrs0% \ifmmode\overline{\mathrm{#1}}\else$\overline{\mbox{#1}}$\fi% \else\ifmmode#1^{'}\else#1$^{'}$\fi\fi} \def\iibar#1{\ifx\prmbrs0% \ifmmode\overline{\overline{\mathrm{#1}}}% \else$\overline{\overline{\mbox{#1}}}$\fi% \else #1P\fi} \def\th{\ifmmode\theta\else$\theta$\fi} \def\al{\ifmmode\alpha\else$\alpha$\fi} \def\be{\ifmmode\beta\else$\beta$\fi} \def\ga{\ifmmode\gamma\else$\gamma$\fi} \def\de{\ifmmode\delta\else$\delta$\fi} \def\spec#1{[Spec,#1]} %Def. of "Specifier of #1" \def\ct#1{{\em #1\/}} %Citation of linguistic material with alternative style: %\def\ct#1{`#1'} \def\tx{\bf} %Introduction of technical terms with alternative style: %\def\tx{\em} \input{cgloss\gbVersion.sty} %%% NEWSTUFF: %\newcommand{\indexgroupmark}[1]{\item{\bf #1}} % ?? -CT % this allows _ to be used in horizontal mode (from J.Frampton): % \catcode`_=\active % \def_#1{\ifmmode\mit{\sb{#1}}\else${}\sb{#1}$\fi} % \catcode`^=\active % \def^#1{\ifmmode\mit{\sp{#1}}\else${}\sp{#1}$\fi} % \def\lb#1{\@ifnextchar [{\@glarph{#1}}{\@bl{#1}}} %\def\@glarph#1[#2]{\ifmmode{[}\sb{{\mathrm{#1}}\sb{#2}}\else% % ${[}\sb{{\mathrm{#1}}\sb{#2}}$\fi} % \def\@bl#1{\ifmmode{[}\sb{\mathrm{#1}}\;\else${[}\sb{\mathrm{#1}}\;$\fi} % \def\rb#1{\@ifnextchar [{\@grarph{#1}}{\@br{#1}}} %\def\@grarph#1[#2]{\ifmmode{]}\sb{{\mathrm{#1}}\sb{#2}}\else% % ${]}\sb{{\mathrm{#1}}\sb{#2}}$\fi} % \def\@br#1{\ifmmode{]}\sb{\mathrm{#1}}\;\else${]}\sb{\mathrm{#1}}\;$\fi} %%% END_NEWSTUFF. %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% % Macros for examples, roughly following Linguistic Inquiry style. % % From here on best not to tamper, else all the examples and cross- % % references will come out scrambled! (see also note below) - CT % % Completely rewritten for more robustness and flexibility. 
(hpk) % %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% \def\qlist{\begin{list}{\Alph{xnum}.}{\usecounter{xnum}% \setlength{\rightmargin}{\leftmargin}}} \def\endqlist{\end{list}} \newif\if@noftnote\@noftnotetrue \newif\if@xrec\@xrecfalse \@definecounter{fnx} %%%% adapted from latex.tex to get examples in footnotes right \long\def\@footnotetext#1{% \@noftnotefalse\setcounter{fnx}{0}% \insert\footins{\reset@font\footnotesize \interlinepenalty\interfootnotelinepenalty \splittopskip\footnotesep \splitmaxdepth \dp\strutbox \floatingpenalty \@MM \hsize\columnwidth \@parboxrestore \edef\@currentlabel{\csname p@footnote\endcsname\@thefnmark}\@makefntext {\rule{\z@}{\footnotesep}\ignorespaces #1\strut}}\@noftnotetrue} \newcount\@xnumdepth \@xnumdepth = 0 \@definecounter{xnumi} \@definecounter{xnumii} \@definecounter{xnumiii} \@definecounter{xnumiv} \@definecounter{exx} \setcounter{exx}{0} \def\thexnumi{\@xsi{xnumi}} \def\thexnumii{\@xsii{xnumii}} \def\thexnumiii{\@xsiii{xnumiii}} \def\thexnumiv{\@xsiv{xnumiv}} \def\p@xnumii{\thexnumi} \def\p@xnumiii{\thexnumi\thexnumii-} \def\p@xnumiv{\thexnumi\thexnumii-\thexnumiii-} \def\xs@default#1{\csname @@xs#1\endcsname} \def\@@xsi{\let\@xsi\arabic} \def\@@xsii{\let\@xsii\alph} \def\@@xsiii{\let\@xsiii\roman} \def\@@xsiv{\let\@xsi\arabic} \@definecounter{rxnumi} \@definecounter{rxnumii} \@definecounter{rxnumiii} \@definecounter{rxnumiv} \def\save@counters{% \setcounter{rxnumi}{\value{xnumi}}% \setcounter{rxnumii}{\value{xnumii}}% \setcounter{rxnumiii}{\value{xnumiii}}% \setcounter{rxnumiv}{\value{xnumiv}}}% \def\reset@counters{% \setcounter{xnumi}{\value{rxnumi}}% \setcounter{xnumii}{\value{rxnumii}}% \setcounter{xnumiii}{\value{rxnumiii}}% \setcounter{xnumiv}{\value{rxnumiv}}}% \def\exewidth#1{\def\@exwidth{#1}} \exewidth{(234)} \def\exe{\@ifnextchar [{\@exe}{\@exe[\@exwidth]}} \def\@exe[#1]{\ifnum \@xnumdepth >0% \if@xrec\@exrecwarn\fi% \if@noftnote\@exrecwarn\fi% \@xnumdepth0\@listdepth0\@xrectrue% \save@counters% \fi% \advance\@xnumdepth \@ne \@@xsi% \begin{list}{(\thexnumi)}% {\usecounter{xnumi}\@subex{#1}{1em}% \if@noftnote% \setcounter{xnumi}{\value{exx}}% \else% \setcounter{xnumi}{\value{fnx}}% \fi}} \def\endexe{\if@noftnote\setcounter{exx}{\value{xnumi}}% \else\setcounter{fnx}{\value{xnumi}}% \reset@counters\@xrecfalse\fi\end{list}} \def\@exrecwarn{\typeout{*** Recursion on "exe"---your example numbering will probably be screwed up!}} \def\xlist{\@ifnextchar [{\@xlist{}}{\@xlist{}[iv.]}} \def\xlista{\@ifnextchar [{\@xlist{\alph}}{\@xlist{\alph}[m.]}} \def\xlisti{\@ifnextchar [{\@xlist{\roman}}{\@xlist{\roman}[iv.]}} \def\xlistn{\@ifnextchar [{\@xlist{\arabic}}{\@xlist{\arabic}[9.]}} \def\xlistA{\@ifnextchar [{\@xlist{\Alph}}{\@xlist{\Alph}[M.]}} \def\xlistI{\@ifnextchar [{\@xlist{\Roman}}{\@xlist{\Roman}[IV.]}} \def\endxlist{\end{list}} \def\endxlista{\end{list}} \def\endxlistn{\end{list}} \def\endxlistA{\end{list}} \def\endxlistI{\end{list}} \def\endxlisti{\end{list}} %%% a generic sublist-styler \def\@xlist#1[#2]{\ifnum \@xnumdepth >3 \@toodeep\else% \advance\@xnumdepth \@ne% \edef\@xnumctr{xnum\romannumeral\the\@xnumdepth}% \def\@bla{#1} \ifx\@bla\empty\xs@default{\romannumeral\the\@xnumdepth}\else% \expandafter\let\csname @xs\romannumeral\the\@xnumdepth\endcsname#1\fi \begin{list}{\csname the\@xnumctr\endcsname.}% {\usecounter{\@xnumctr}\@subex{#2}{1.5ex}}\fi} \def\@subex#1#2{\settowidth{\labelwidth}{#1}\itemindent\z@\labelsep#2% \ifnum\the\@xnumdepth=1\topsep 7\p@ plus2\p@ minus3\p@\else% \topsep 2\p@ plus2\p@\fi\parsep 
2\p@ plus\p@ minus\p@% \itemsep \parsep\leftmargin\labelwidth\advance\leftmargin#2\relax} %%% the example-items \def\ex{\@ifnextchar [{\@ex}{\item}} \def\@ex[#1]#2{\item\@exj[#1]{#2}} \def\@exj[#1]#2{\@exjbg{#1} #2 \end{list}} \def\exi#1{\item[#1]\@ifnextchar [{\@exj}{}} \def\judgewidth#1{\def\@jwidth{#1}} \judgewidth{??} \def\@exjbg#1{\begin{list}{#1}{\@subex{\@jwidth}{.5ex}}\item} \def\exr#1{\exi{{(\ref{#1})}}} \def\exp#1{\exi{{(\ref{#1}$'$)}}} \def\sn{\exi{}} \def\bu{\item[$\bullet$]} %%%%%%% \lcomment for breaks in (example-)lists (leaves all counters %%%%%%% as they are) (hpk) \newlength{\lcommentsep} \lcommentsep = 1ex \long\def\lcomment#1% {\vspace{\lcommentsep} \item[]\hspace*{-\leftmargin}% \@tempskipa=\linewidth% \addtolength{\@tempskipa}{\rightmargin}% \addtolength{\@tempskipa}{\leftmargin}% \parbox{\@tempskipa}{#1}% \vspace{\lcommentsep}% } %%%%%% control the alignment of exampleno. and (picture-)example %%%%%% (by Lex Holt ). \def\attop#1{\leavevmode\vtop{\strut\vskip-\baselineskip\vbox{#1}}} \def\atcenter#1{$\vcenter{#1}$} %%%%%% %-------------------Move Arrows (from J.Frampton): \def\leaderfill{\leaders\hrule\hfil} \def\pointerup{\hbox to 0pt{\hss \vbox{\offinterlineskip\vskip-1pt\hbox{\elevenex\char'170}\null}\hss}} \def\pointerdown{\hbox to 0pt{\hss \vtop{\offinterlineskip\null\hbox{\elevenex\char'171}\vskip-1pt}\hss}} \let\pu=\pointerup \let\pd=\pointerdown \let\lf=\leaderfill \def\spacer{\hskip4.5pt} \def\fillright#1{\hfil#1\leaderfill} \def\fillleft#1{\leaderfill#1\hfil} % Changed spelling to \centr, else conflicts with LaTeX \center{} -CT \def\centr#1{\leaderfill#1\leaderfill} \def\link#1{\multispan#1\leaderfill} \def\arrowalign#1{\vtop{\baselineskip=0pt \lineskiplimit=0pt \lineskip=2pt \halign{&##\cr#1}}} %\font\elevenex=cmex10 scaled\magstephalf % just for the arrow! %PS: this may not work on some installations, not sure why. 
CT %%PPS: (e.g., PCTeX, but it works find works fine with EmTeX) %----------------END Move Arrows \def\pijl{$\rightarrow$\ } % Special accents for Vata & Gbadi; Navajo coming soon, I hope...: %\def\bb#1{$\mathrm{\overline{#1}}$} Following looks better: \def\bb#1{\ifmmode\overline{\mathrm{#1}}\else$\bar{\mathrm{#1}}$\fi} \def\boven#1#2{\raisebox{-0.2pt}{$\stackrel{#1}{\mathrm{#2}}$}} \def\bovenop#1#2{\raisebox{-0.06ex}[0ex][0ex]{$\stackrel{#1}{\mathrm{#2}}$}} \def\vl{\rule{0.05em}{0.30em}} \def\|#1{\ifmmode\vert#1\else\bovenop{\vl}{#1}\fi} ================================================ FILE: docs/realizer/manual.tex ================================================ %% %% nb: use pdflatex to create pdf file with hyperlinks %% %% ===================================================================== %% DOCUMENT DATA %% ===================================================================== \documentclass[11pt]{article} \title{OpenCCG Realizer Manual} \author{Michael White} %% ===================================================================== %% PACKAGES %% ===================================================================== \usepackage{openccg} % for hlds/ccg \usepackage{graphicx} % for figs \usepackage{gb4e} % for examples %\usepackage{cgmacros,hylo,ccg} % for hlds/ccg \usepackage[ colorlinks=true, linkcolor=blue, citecolor=blue, urlcolor=blue, pdfstartview=FitH, pdftitle={OpenCCG Realizer Manual}, pdfauthor={Michael White} ]{hyperref} %\usepackage{mathptmx} %% listing settings %% nb: not crazy about font, esp that bold not working with keywords \usepackage{listings,color} \lstset{language=Java,basicstyle=\ttfamily\footnotesize,keywordstyle=\underline,commentstyle=\itshape\color{blue}} %basicstyle=\ttfamily\small %% ===================================================================== %% NEW COMMANDS %% ===================================================================== %\newcommand{\occg}{\textsf{OpenCCG}} \newcommand{\occg}{OpenCCG} \newcommand{\tccg}{\textsf{tccg}} \newcommand{\ccgrz}{\textsf{ccg-realize}} \newcommand{\ccgtest}{\textsf{ccg-test}} \newcommand{\code}[1]{\texttt{#1}} %\small \newcommand{\eref}[2][]{(\ref{ex:#2}#1)} % ref to examples \newcommand{\secref}[1]{Section~\ref{sec:#1}} % ref to sections \newcommand{\figref}[1]{Figure~\ref{fig:#1}} % ref to figures \newlength{\mytablen} % for indenting in terms \newcommand{\mytab}[1]{ \settowidth{\mytablen}{\ensuremath{#1}} \mbox{\hspace{\mytablen}} } \newcommand{\xor}{~\underline{\vee}~} \newcommand{\shared}[1]{\fbox{\ensuremath{#1}}} \newcommand{\alt}[1]{\mathsf{alt}_{#1}} \newcommand{\opt}[1]{\mathsf{opt}_{#1}} %% ===================================================================== %% DOCUMENT BODY %% ===================================================================== \begin{document} \thispagestyle{empty} \maketitle \tableofcontents %\listoftables \listoffigures \newpage %% to do: %% making an n-gram model %% DLFs \section{About this manual} This manual is a programmer's guide to using the \occg\ surface realizer in Java applications. You can download and install \occg\ from its website, \url{http://openccg.sourceforge.net}. Once you've unpacked the archive, have a look at the \texttt{README} file for installation instructions. For a brief introduction to writing grammars for \occg, see the ``rough guide'' in \texttt{docs/grammars-rough-guide.pdf}. 
\section{About the OpenCCG realizer} \label{overview} The OpenCCG realizer \cite{White/Baldridge:2003,White-RLAC:2004,White-INLG:2004,White-ACLSoft:2005} is an open source surface realizer for Steedman's \cite{Steedman-LI:2000,Steedman:SynProc} Combinatory Categorial Grammar (CCG), including the multi-modal extensions to CCG devised by Baldridge and Kruijff \cite{Baldridge:PhD,Baldridge/Kruijff:2003}. Like other chart realizers \cite{Kay:1996,Shemtov:PhD,Carroll-and-co:1999,Bob-Moore:2002}, the OpenCCG realizer takes as input a logical form specifying the propositional meaning of a sentence, and returns one or more surface strings that express this meaning according to the lexicon and grammar. A distinguishing feature of OpenCCG is that it implements a hybrid symbolic-statistical chart realization algorithm that combines (1) a theoretically grounded approach to syntax and semantic composition, with (2) the use of integrated language models for making choices among the options left open by the grammar, thereby reducing the need for hand-crafted rules. To allow language models to be combined in flexible ways---as well as to enable research on how to best combine language modeling and realization---OpenCCG's design includes an extensible API (application programming interface) that allows user-defined functions to be used for scoring partial realizations and for pruning low-scoring ones during the search. The design also includes classes for supporting a range of language models and typical ways of combining them. \begin{figure*}%[t]%[t]%[!h] \begin{center} \mbox{} \includegraphics[width=\textwidth]{realizer-class.pdf} \caption{High-level architecture of the OpenCCG realizer} \label{realizer-class} \end{center} \end{figure*} The UML class diagram in Figure~\ref{realizer-class} shows the high-level architecture of the OpenCCG realizer. A realizer instance is constructed with a reference to a CCG grammar (which supports both parsing and realization). The grammar's lexicon has methods for looking up lexical items via their surface forms (for parsing), or via the principal predicates or relations in their semantics (for realization). A grammar also has a set of hierarchically organized atomic types, which can serve as the values of features in the syntactic categories, or as ontological sorts for the discourse referents in the logical forms (LFs). Lexical lookup yields lexical signs. A sign pairs a list of words with a category, which itself pairs a syntactic category with a logical form. Lexical signs are combined into derived signs using the rules in the grammar's rule group. Derived signs maintain a derivation history, and their word lists share structure with the word lists of their input signs. For generality, the realizer makes use of a configurable sign scorer and pruning strategy. A sign scorer implements a function that returns a number between 0 and 1 for an input sign. For example, a standard trigram language model can be used to implement a sign scorer, by returning the probability of a sign's words as its score. A pruning strategy implements a method for determining which edges to prune during the realizer's search. The input to the method is a ranked list of edges for signs that have equivalent categories (but different words); grouping edges in this way ensures that pruning cannot ``break'' the realizer, i.e.\ prevent it from finding some grammatical derivation when one exists. 
By default, an N-best pruning strategy is employed, which keeps the N highest scoring input edges, pruning the rest (where N is determined by the current preference settings). \begin{figure*}%[p]%[t]%[!h] \begin{center} % \mbox{} % \includegraphics{code/realize.pdf} \begin{lstlisting} // load grammar, instantiate realizer URL grammarURL = ...; Grammar grammar = new Grammar(grammarURL); Realizer realizer = new Realizer(grammar); // configure realizer with trigram backoff model // and 10-best pruning strategy realizer.signScorer = new StandardNgramModel(3, "lm.3bo"); realizer.pruningStrategy = new NBestPruningStrategy(10); // ... then, for each request: // get LF from input XML Document inputDoc = ...; LF lf = realizer.getLfFromDoc(inputDoc); // realize LF and get output words in XML Edge bestEdge = realizer.realize(lf); Document outputDoc = bestEdge.sign.getWordsInXml(); // return output ... outputDoc ...; \end{lstlisting} \caption{Example realizer usage} \label{realizer-usage} \end{center} \end{figure*} \section{Using the realizer} Sample Java code for using the realizer appears in Figure~\ref{realizer-usage}. The input is an XML document that contains an \code{lf} element either as the root or as a child of the root. To create a sample XML document with an acceptable format, you can use the \tccg\ tool's \code{:2xml } command. Note that the input XML document can be created in any way that is allowed by the JDOM API. For example, if the logical form is created by a Java XSLT-based sentence planner in the same process, the XSLT output can be captured in a JDOM document, and then simply passed by reference to the realizer. The output of the realizer is typically an XML document, as shown in the figure. In such documents, each word in the output sequence appears in its own element; additionally, any pitch accents and boundary tones appear in separate elements, and any expanded multi-words are indicated. Output documents of this kind can be easily processed into other formats using XSLT. If a simple string output suffices, the \code{Sign.getOrthography()} method can be used instead. The realization algorithm is implemented by the \code{realize(LF)} method. As in the chart realizers cited earlier, the algorithm makes use of a chart and an agenda to perform a bottom-up dynamic programming search for signs whose LFs completely cover the elementary predications in the input logical form. The algorithm's details and a worked example appear in \cite{White-RLAC:2004,White-INLG:2004}. To see a full realization trace, you can use \ccgrz\ to realize an LF stored in an XML file (e.g.\ one created using \tccg). As shown in Figure~\ref{realizer-usage}, the \code{realize(LF)} method returns the edge for the best realization of the input LF, as determined by the sign scorer. After a realization request, the N-best complete edges---or more generally, all the edges for complete realizations that survived pruning---are also available from the chart. To access these edges, you can invoke \code{realizer.getChart().bestEdges()}. The search for complete realizations proceeds in one of two modes, anytime and two-stage (packing/unpacking). In the anytime mode, a best-first search is performed with a configurable time limit (which may be a limit on how long to look for a better realization, after the first complete one is found). With this mode, the scores assigned by the sign scorer determine the order of the edges on the agenda, and thus have an impact on realization speed. 
In the two-stage mode, a packed forest of all possible realizations is created in the first stage; then in the second stage, the packed representation is unpacked in bottom-up fashion, with scores assigned to the edge for each sign as it is unpacked, much as in \cite{Langkilde:2000}. In both modes, the pruning strategy is invoked to determine whether to keep or prune newly constructed edges. For single-best output, the anytime mode can provide signficant time savings by cutting off the search early; see \cite{White-INLG:2004} for discussion. For N-best output---especially when a complete search (up to the edges that survive the pruning strategy) is desirable---the two-stage mode can be more efficient. \section{Scoring signs} The classes for implementing sign scorers appear in Figure~\ref{scorer-class}. In the diagram, classes for n-gram scoring appear towards the bottom, while classes for combining scorers appear on the left, and the class for avoiding repetition appears on the right. \begin{figure*}%[p]%[t]%[!h] \begin{center} \mbox{} \includegraphics[width=\textwidth]{scorer-class.pdf} \caption{Classes for scoring signs} \label{scorer-class} \end{center} \end{figure*} \subsection{Standard n-gram models} \label{standard-ngrams} The \code{Standard\-Ngram\-Model} class can load standard n-gram backoff models for scoring, as shown earlier in Figure~\ref{realizer-usage}. Such models can be constructed with the SRILM toolkit \cite{SRILM-ICSLP:2002}, as described in Section~\ref{using-srilm}; in principle, other toolkits could be used instead, as long as their output could be converted into the same file formats. Since the SRILM toolkit has more restrictive licensing conditions than those of OpenCCG's LGPL license, OpenCCG includes its own classes for scoring with n-gram models, in order to avoid any necessary runtime dependencies on the SRILM toolkit. The n-gram tables are efficiently stored in a trie data structure (as in the SRILM toolkit), thereby avoiding any arbitrary limit on the n-gram order. To save memory and speed up equality tests, each string is interned (replaced with a canonical instance) at load time, which accomplishes the same purpose as replacing the strings with integers, but without the need to maintain a separate mapping from integers back to strings. For better generalization, certain words may be dynamically replaced with the names of their semantic classes when looking up n-gram probabilities. Words are assigned to semantic classes in the lexicon, and the semantic classes to use in this way may be configured at the grammar level. Note that \cite{Oh/Rudnicky:2002} and \cite{Adwait:2002} make similar use of semantic classes in n-gram scoring, by deferring the instantiation of classes (such as \textit{departure city}) until the end of the generation process; our approach accomplishes the same goal in a slightly more flexible way, in that it also allows the specific word to be examined by other scoring models, if desired. As discussed in \cite{White-INLG:2004}, with dialogue systems like COMIC n-gram models can do an excellent job of placing underconstrained adjectival and adverbial modifiers---as well as boundary tones---without resorting to the more complex methods investigated for adjective ordering in \cite{Shaw/Hatzi:1999,Malouf:2000}. 
For instance, in examples like those in \eref{adv-placement}, they correctly select the preferred positions for \textit{here} and \textit{also} (as well as for the boundary tones), with respect to the verbal head and sister dependents: \begin{exe} %\small \ex \label{ex:adv-placement} \begin{xlist} \ex Here$_{L+H*}$ LH\% we have a design in the classic$_{H*}$ style LL\% . \ex This$_{L+H*}$ design LH\% here$_{L+H*}$ LH\% is also$_{H*}$ classic LL\% . \end{xlist} \end{exe} We have also found that it can be useful to use reverse (or ``right-to-left'') models, as they can help to place adverbs like \textit{though}, as in \eref{though}: \begin{exe} %\small \ex \label{ex:though} The tiles are also$_{H*}$ from the Jazz$_{H*}$ series though LL\% . \end{exe} \noindent In principle, the forward and reverse probabilities should be the same---as they are both derived via the chain rule from the same joint probability of the words in the sequence---but we have found that with sparse data the estimates can differ substantially. In particular, since \textit{though} typically appears at the end of a variety of clauses, its right context is much more predictable than its left context, and thus reverse models yield more accurate estimates of its likelihood of appearing clause-finally. \subsection{N-gram scorers} The \code{Standard\-Ngram\-Model} class is implemented as a subclass of the base class \code{Ngram\-Scorer}. All \code{Ngram\-Scorer} instances may have any number of \code{Ngram\-Filter} instances, whose \code{filter\-Out} methods are invoked prior to n-gram scoring; if any of these methods return true, a score of zero is immediately returned. The \code{AAn\-Filter} provides one concrete implementation of the \code{Ngram\-Filter} interface, and returns true if it finds a bigram consisting of \textit{a} followed by a vowel-inital word, or \textit{an} followed by a consonant-initial word, subject to a configurable set of exceptions that can be culled from bigram counts. We have found that such n-gram filters can be more efficient, and more reliable, than relying on n-gram scores alone; in particular, with \textit{a/an}, since the unigram probability for \textit{a} tends to be much higher than that of \textit{an}, with unseen words beginning with a vowel, there may not be a clear preference for the bigram beginning with \textit{an}. The base class \code{Ngram\-Scorer} implements the bulk of the \code{score} method, using an abstract \code{log\-Prob\-From\-Ngram} method for subclass-specific calculation of the log probabilities (with backoff) for individual n-grams. The \code{score} method also invokes the \code{prepare\-To\-Score\-Words} method, in order to allow for subclass-specific pre-processing of the words in the given sign. With \code{Standard\-Ngram\-Model}, this method is used to extract the word forms or semantic classes into a list of strings to score. It also appends any pitch accents to the word forms or semantic classes, effectively treating them as integral parts of the words. Since the realizer builds up partial realizations bottom-up rather than left-to-right, it only adds start of sentence (and end of sentence) tags with complete realizations. As a consequence, the words with less than a full $n-1$ words of history are scored with appropriate sub-models. For example, the first word of a phrase is scored with a unigram sub-model, without imposing backoff penalties. 
Another consequence of bottom-up realization is that both the left- and right-contexts may change when forming new signs from a given input sign. Consequently, it is often not possible (even in principle) to use the score of an input sign directly in computing the score of a new result sign. If one could make assumptions about how the score of an input sign has been computed---e.g., by a bigram model---one could determine the score of the result sign from the scores of the input signs together with an adjustment for the word(s) whose context has changed. However, our general approach to sign scoring precludes making such assumptions. Nevertheless, it is still possible to improve the efficiency of n-gram scoring by caching the log probability of a sign's words, and then looking up that log probability when the sign is used as the first input sign in creating a new combined sign---thus retaining the same left context---and only recomputing the log probabilities for the words of any input signs past the first one. (With reverse models, the sign must be the last sign in the combination.) In principle, the derivation history could be consulted further to narrow down the words whose n-gram probabilities must be recomputed to the minimum possible, though \code{Ngram\-Scorer} only implements a single-step lookup at present.\footnote{Informal experiments indicate that caching log probabilities in this way can yield an overall reduction in best-first realization times of 2-3\% on average.} Finally, note that a Java \code{Weak\-Hash\-Map} is used to implement the cache, in order to avoid an undesirable buildup of entries across realization requests. \subsection{Interpolation} \label{interpolation} Scoring models may be linearly interpolated in two ways. Sign scorers of any variety may be combined using the \code{Sign\-Scorer\-Interpolation} class. For example, Figure~\ref{forward-reverse-interpolation} shows how forward and reverse n-gram models may be interpolated. \begin{figure*}%[p]%[t]%[!h] \begin{center} \begin{lstlisting} // configure realizer with 4-gram forward and reverse backoff // models, interpolated with equal weight NgramScorer forwardModel = new StandardNgramModel(4, "lm.4bo"); NgramScorer reverseModel = new StandardNgramModel(4, "lm-r.4bo"); reverseModel.setReverse(true); realizer.signScorer = new SignScorerInterpolation( new SignScorer[] { forwardModel, reverseModel } ); \end{lstlisting} \caption{Example interpolated n-gram model} \label{forward-reverse-interpolation} \end{center} \end{figure*} With n-gram models of the same direction, it is also possible to linearly interpolate models at the word level, using the \code{Linear\-Ngram\-Scorer\-Combo} class. Word-level interpolation makes it easier to use cache models created with maximum likelihood estimation, as word-level interpolation with a base model avoids problems with zero probabilities in the cache model. As discussed in \cite{Carsten-Alignment:2005}, cache models can be used to promote alignment with a conversational partner, by constructing a cache model from the bigrams in the partner's previous turn, and interpolating it with a base model.\footnote{At present, such cache models must be constructed with a call to the SRILM toolkit; it would not be difficult to add OpenCCG support for constructing them though, since these models do not require smoothing.} Figure~\ref{base-cache-interpolation} shows one way to create such an interpolated model. 
\begin{figure*}%[p]%[t]%[!h]
\begin{center}
\begin{lstlisting}
// configure realizer with 4-gram backoff base model,
// interpolated at the word level with a bigram maximum-likelihood
// cache model, with more weight given to the base model
NgramScorer baseModel = new StandardNgramModel(4, "lm.4bo");
NgramScorer cacheModel = new StandardNgramModel(2, "lm-cache.mle");
realizer.signScorer = new LinearNgramScorerCombo(
    new SignScorer[] { baseModel, cacheModel },
    new double[] { 0.6, 0.4 }
);
\end{lstlisting}
\caption{Example word-level interpolation of a cache model}
\label{base-cache-interpolation}
\end{center}
\end{figure*}

\subsection{N-gram precision models}
\label{ngram-precision}

The \code{NgramPrecisionModel} subclass of \code{Ngram\-Scorer} computes a modified version of the Bleu score used in MT evaluation \cite{Bleu:2001}. Its constructor takes as input an array of target strings---from which it extracts the n-gram sequences to use in computing the n-gram precision score---and the desired order. Unlike with the Bleu score, rank order centroid weights (rather than the geometric mean) are used to combine scores of different orders, which avoids problems with scoring partial realizations which have no n-gram matches of the target order. For simplicity, the score also does not include the Bleu score's bells and whistles to make cheating on length difficult. We have found n-gram precision models to be very useful for regression testing the grammar, as an n-gram precision model created just from the target string nearly always leads the realizer to choose that exact string as its preferred realization. These models can also be useful for evaluating the success of different scoring models in a cross-validation setup, though with high quality output, manual inspection is usually necessary to determine the importance of any differences between the preferred realization and the target string. Finally, note that n-gram precision models can be used as a quick-and-dirty substitute for standard n-gram models, if one does not have time to install and use the SRILM toolkit.

\subsection{Factored language models}

A factored language model \cite{Bilmes-Kirchoff:2003} is a new kind of language model that treats words as bundles of factors. To support scoring with such models, OpenCCG represents words as objects with a surface form, pitch accent, stem, part of speech, supertag, and semantic class. Words may also have any number of further attributes, such as associated gesture classes, in order to handle in a general way elements like pitch accents that are ``coarticulated'' with words. To represent words efficiently, and to speed up equality tests, all attribute values are interned, and the \code{Word} objects themselves are interned via a factory method. Note that in Java, it is straightforward to intern objects other than strings by employing a \code{Weak\-Hash\-Map} to map from an object key to a weak reference to itself as the canonical instance. (Using a weak reference avoids accumulating interned objects that would otherwise be garbage collected.) With the SRILM toolkit, factored language models can be constructed that support \textit{generalized parallel backoff}: that is, backoff order is not restricted to just dropping the most temporally distant word first, but rather may be specified as a path through the set of contextual parent variables; additionally, parallel backoff paths may be specified, with the possibility of combining these paths dynamically in various ways.
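As a brief aside, the \code{Weak\-Hash\-Map} interning idiom mentioned above can be sketched in a few lines of plain Java, as in Figure~\ref{interning-sketch}. The sketch illustrates the technique only; it is not OpenCCG's actual factory code for \code{Word} objects.

\begin{figure*}%[p]%[t]%[!h]
\begin{center}
\begin{lstlisting}
// illustration of interning via a WeakHashMap (not OpenCCG's actual factory code):
// map from an object key to a weak reference to itself as the canonical instance
import java.lang.ref.WeakReference;
import java.util.Map;
import java.util.WeakHashMap;

public class Interner {
    private final Map cache = new WeakHashMap();

    // returns the canonical instance that equals the given object
    public synchronized Object intern(Object obj) {
        WeakReference ref = (WeakReference) cache.get(obj);
        Object canonical = (ref != null) ? ref.get() : null;
        if (canonical == null) {
            canonical = obj;
            // the weak reference lets unused canonical instances be collected
            cache.put(obj, new WeakReference(obj));
        }
        return canonical;
    }
}
\end{lstlisting}
\caption{Sketch of interning arbitrary objects with a \code{Weak\-Hash\-Map} (illustration only)}
\label{interning-sketch}
\end{center}
\end{figure*}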
In OpenCCG, the \code{Factored\-Ngram\-Model} class supports scoring with factored language models that employ generalized backoff, though parallel backoff is not yet supported, as it remains somewhat unclear whether the added complexity of parallel backoff is worth the implementation effort. Typically, several related factored language models are specified in a single file and loaded by a \code{Factored\-Ngram\-Model\-Family}, which can multiplicatively score models for different child variables, and include different sub-models for the same child variable. To illustrate, let us consider a simplified version of the factored language model family used in the COMIC realizer. This model computes the probability of the current word given the preceding ones according to the formula shown in \eref{comic-flm}, where a word consists of the factors word (W), pitch accent (A), gesture class (GC), and gesture instance (GI), plus the other standard factors which the model ignores: \begin{exe} \ex \label{ex:comic-flm} \begin{small} \( \begin{array}{l} P(\langle W,A,GC,GI \rangle \, | \, \langle W,A,GC,GI \rangle_{-1} \, \ldots) \approx \\ \; \; \; P(W \, | \, W_{-1} W_{-2} A_{-1} A_{-2}) \; \times \\ \; \; \; P(GC \, | \, W) \; \times \\ \; \; \; P(GI \, | \, GC) \\ \end{array} \) \end{small} \end{exe} \noindent In \eref{comic-flm}, the probability of the current word is approximated by the probability of the current word form given the preceding two word forms and preceding two pitch accents, multiplied by the probability of the current gesture class given the current word form, and by the probability of the current gesture instance given the current gesture class. Note that in the COMIC grammar, the choice of pitch accent is entirely rule governed, so the current pitch accent is not scored separately in the model. However, the preceding pitch accents are taken into account in predicting the current word form, as perplexity experiments have suggested that they do provide additional information beyond that provided by the previous word forms. The specification file for this model appears in Figure~\ref{flm-spec}. The format of the file is a restricted form of the files used by the SRILM toolkit to build factored language models. The file specifies four models, where the first, third and fourth models correspond to those in \eref{comic-flm}. With the first model, since the previous words are typically more informative than the previous pitch accents, the backoff order specifies that the most distant accent, \code{A(-2)}, should be dropped first, followed by the previous accent, \code{A(-1)}, then the most distant word, \code{W(-2)}, and finally the previous word, \code{W(-1)}. The second model is considered a sub-model of the first---since it likewise predicts the current word---to be used when there is only one word of context available (i.e.\ with bigrams). Note that when scoring a bigram, the second model will take the previous pitch accent into account, whereas the first model would not. For documentation of the file format as it is used in the SRILM toolkit, see \cite{FLM-JHSW:2002}. 
\begin{figure*}%[p]%[t]%[!h]
\begin{footnotesize}
\begin{verbatim}
## Simplified COMIC realizer FLM spec file
## Trigram Word model based on previous words and accents, dropping accents first,
## with bigram sub-model;
## Unigram Gesture Class model based on current word; and
## Unigram Gesture Instance model based on current gesture class
4
## 3gram with A
W : 4 W(-1) W(-2) A(-1) A(-2) w_w1w2a1a2.count w_w1w2a1a2.lm 5
W1,W2,A1,A2 A2 ndiscount gtmin 1
W1,W2,A1 A1 ndiscount gtmin 1
W1,W2 W2 ndiscount gtmin 1
W1 W1 ndiscount gtmin 1
0 0 ndiscount gtmin 1
## bigram with A
W : 2 W(-1) A(-1) w_w1a1.count w_w1a1.lm 3
W1,A1 A1 ndiscount gtmin 1
W1 W1 ndiscount gtmin 1
0 0 ndiscount gtmin 1
## Gesture class depends on current word
GC : 1 W(0) gc_w0.count gc_w0.lm 2
W0 W0 ndiscount gtmin 1
0 0 ndiscount gtmin 1
## Gesture instance depends only on class
GI : 1 GC(0) gi_gc0.count gi_gc0.lm 2
GC0 GC0 ndiscount gtmin 1
0 0
\end{verbatim}
\end{footnotesize}
\caption{Example factored language model family specification}
\label{flm-spec}
\end{figure*}

Like \code{Standard\-Ngram\-Model}, the \code{Factored\-Ngram\-Model} class stores its n-gram tables in a trie data structure, except that it stores an interned factor key (i.e.\ a factor name and value pair, or just a string, in the case of the word form) at each node, rather than a simple string. During scoring, the \code{log\-Prob\-From\-Ngram} method determines the log probability (with backoff) of a given n-gram by extracting the appropriate sequence of factor keys, and using them to compute the log probability as with standard n-gram models. The \code{Factored\-Ngram\-Model\-Family} class computes log probabilities by delegating to its component factored n-gram models (choosing sub-models when appropriate) and summing the results.

\subsection{Avoiding repetition}

While cache models appear to be a promising avenue to promote lexical and syntactic alignment with a conversational partner, a different mechanism appears to be called for to avoid ``self-alignment''---that is, to avoid the repetitive use of words and phrases. As a means to experiment with avoiding repetition, OpenCCG includes the \code{Repetition\-Scorer} class. This class makes use of a configurable penalty plus a set of methods for dynamically managing the context. It returns a score of \( 10^{- c_r \times p} \), where $c_r$ is the count of repeated items, and $p$ is the penalty. Note that this formula returns 1 if there are no repeated items, and otherwise returns a score that is linear in log space in the number of repeated items. A repetition scorer can be combined multiplicatively with an n-gram model, in order to discount realizations that repeat items from the recent context. Figure~\ref{rep-scorer} shows such a combination, together with the operations for updating the context. By default, open class stems are considered the relevant items over which to count repetitions, though this behavior can be specialized by subclassing \code{Repetition\-Scorer} and overriding the \code{updateItems} method. Note that in counting repetitions, full counts are given to items in the previous words or recent context, while fractional counts are given to older items; the exact details may likewise be changed in a subclass, by overriding the \code{repeatedItems} method.
\begin{figure*}%[p]%[t]%[!h]
\begin{center}
\begin{lstlisting}
// set up n-gram scorer and repetition scorer
String lmfile = "ngrams/combined.flm";
NgramScorer ngramScorer = new FactoredNgramModelFamily(lmfile, true);
ngramScorer.addFilter(new AAnFilter());
RepetitionScorer repetitionScorer = new RepetitionScorer();
// combine n-gram scorer with repetition scorer
realizer.signScorer = new SignScorerProduct(
    new SignScorer[] { ngramScorer, repetitionScorer }
);
// ... then, after each realization request,
Edge bestEdge = realizer.realize(lf);
// ... update repetition context for next realization:
repetitionScorer.ageContext();
repetitionScorer.updateContext(bestEdge.getSign());
\end{lstlisting}
\caption{Example combination of an n-gram scorer and a repetition scorer}
\label{rep-scorer}
\end{center}
\end{figure*}

\subsection{Building language models with the SRILM toolkit}
\label{using-srilm}

You can use \occg's regression testing tool, \ccgtest, to help build and test language models built with the SRILM toolkit. By default, running \ccgtest\ will use the grammar in the current directory to parse and realize the default regression file, \code{testbed.xml}, using an n-gram precision model constructed for each test item. Using the appropriate command-line options, it is also possible to export the text of the test items in order to construct an n-gram model with the SRILM toolkit, and then use the resulting model in testing the realizer. To display the syntax of \ccgtest's command-line options, you can invoke it with the \code{-h} option, as shown in \eref{ccg-test-help}. To export the text of the test items to a text file, you use the \code{-text} option, as in \eref{export-text}. The next step is to use SRILM's \code{ngram-count} tool to build an n-gram language model. In \eref{make-lm},\footnote{This command, and the ensuing ones, should be entered on one line.} \code{ngram-count} is used to build a 4-gram backoff model, \code{n.4bo}, from the text file \code{tb.txt}, using Ristad's ``natural'' discounting method \cite{Ristad:1995}. For small test sets, we have found that Ristad's method works better than the default one (Good-Turing). Note that in \eref{make-lm}, the \code{-unk} option is used to reserve some probability for unknown words; the \code{-gt1min 1} through \code{-gt4min 1} options specify that all 1-counts should be kept; and the \code{-ndiscount1} through \code{-ndiscount4} options specify the use of natural discounting for unigrams through 4-grams. Finally, to test the resulting language model, you use \ccgtest's \code{-ngramorder} and \code{-lm} options, as shown in \eref{test-lm}.

\begin{exe} %\small
\ex %\label{ex:make-test-lm}
\begin{xlist}
\ex \label{ex:ccg-test-help}
\code{ccg-test -h}
\ex \label{ex:export-text}
\code{ccg-test -text tb.txt}
\ex \label{ex:make-lm}
\code{ngram-count -order 4 -unk -text tb.txt -lm n.4bo \\
  -gt1min 1 -gt2min 1 -gt3min 1 -gt4min 1 \\
  -ndiscount1 -ndiscount2 -ndiscount3 -ndiscount4}
\ex \label{ex:test-lm}
\code{ccg-test -noparsing -ngramorder 4 -lm n.4bo}
\end{xlist}
\end{exe}

To perform a simple 2-fold cross-validation, \ccgtest\ includes options for exporting or testing just the even or odd test items. The command in \eref{export-even} shows how you can export just the text of the even-numbered test items.
Note that the \code{-textsc} option specifies that the text be exported using semantic class replacement, i.e.\ with certain words replaced with their semantic classes; the classes to use for this purpose are specified using the \code{replacement-sem-classes} attribute of the \code{tokenizer} element in the \code{grammar.xml} file. The next step is to build a language model just as before; the abbreviated command appears in \eref{make-even-lmsc}. Finally, you can test the language model on just the odd-numbered items, as in \eref{test-odd}, where the \code{-lmsc} option specifies that semantic class replacement should be employed when scoring realizations with the model. Naturally, you can switch the \code{-even} and \code{-odd} flags, and adjust the text and language model names, to test realization on the even-numbered items, using a language model trained from the odd-numbered ones.

\begin{exe} %\small
\ex %\label{ex:even-odd}
\begin{xlist}
\ex \label{ex:export-even}
\code{ccg-test -even -textsc tb-sc.even.txt}
\ex \label{ex:make-even-lmsc}
\code{ngram-count -order 4 -unk -text tb-sc.even.txt \\
  -lm n-sc.even.4bo ...}
\ex \label{ex:test-odd}
\code{ccg-test -noparsing -odd -ngramorder 4 -lmsc n-sc.even.4bo}
\end{xlist}
\end{exe}

An example of building a factored language model appears next. In \eref{export-fsc}, the text of the test items is exported, where each word appears with all its factors, and word forms are replaced with semantic classes when appropriate. In \eref{make-flmsc}, SRILM's \code{fngram-count} is used to create a factored language model from the spec file named \code{spec.flm}. (Note that the various individual language model files are listed in the spec file.) Finally, \eref{test-flm} shows how the factored language model can be tested in \ccgtest.

\begin{exe} %\small
\ex
\begin{xlist}
\ex \label{ex:export-fsc}
\code{ccg-test -textfsc tb-fsc.txt}
\ex \label{ex:make-flmsc}
\code{fngram-count -factor-file spec.flm -text tb-fsc.txt -lm -unk}
\ex \label{ex:test-flm}
\code{ccg-test -noparsing -flmsc spec.flm}
\end{xlist}
\end{exe}

\section{Pruning Strategies}
\label{pruning}

The classes for defining edge pruning strategies appear in Figure~\ref{pruner-class}. As mentioned in Section~\ref{overview}, an N-best pruning strategy is employed by default, where N is determined by the current preference settings. It is also possible to define custom strategies. To support the definition of a certain kind of custom strategy, the abstract class \code{Diversity\-Pruning\-Strategy} provides an N-best pruning strategy that promotes diversity in the edges that are kept, according to the equivalence relation established by the abstract \code{not\-Compellingly\-Different} method. In particular, in order to determine which edges to keep, a diversity pruning strategy clusters the edges into a ranked list of equivalence classes, which are sequentially sampled until the limit N is reached. If the \code{single\-Best\-Per\-Group} flag is set, then a maximum of one edge per equivalence class is retained.

\begin{figure*}%[p]%[t]%[!h]
\begin{center}
\mbox{} %scale=1.25
\includegraphics[width=\textwidth]{pruner-class.pdf}
\caption{Classes for defining pruning strategies}
\label{pruner-class}
\end{center}
\end{figure*}

As an example, the COMIC realizer's diversity pruning strategy appears in Figure~\ref{gest-diversity-strategy}.
The idea behind this strategy is to avoid having the N-best lists become full of signs whose words differ only in the exact gesture instance associated with one or more of the words. With this strategy, if two signs differ in just this way, the edge for the lower-scoring sign will be considered ``not compellingly different'' and pruned from the N-best list, making way for other edges whose signs exhibit more interesting differences.

\begin{figure*}%[p]%[t]%[!h]
\begin{center}
\begin{lstlisting}
// configure realizer with gesture diversity pruner
realizer.pruningStrategy = new DiversityPruningStrategy() {
    /**
     * Returns true iff the given signs are not compellingly different;
     * in particular, returns true iff the words differ only in their
     * gesture instances.
     */
    public boolean notCompellinglyDifferent(Sign sign1, Sign sign2) {
        List words1 = sign1.getWords();
        List words2 = sign2.getWords();
        if (words1.size() != words2.size()) return false;
        for (int i = 0; i < words1.size(); i++) {
            Word w1 = (Word) words1.get(i);
            Word w2 = (Word) words2.get(i);
            if (w1 == w2) continue;
            if (w1.getForm() != w2.getForm()) return false;
            if (w1.getPitchAccent() != w2.getPitchAccent()) return false;
            if (w1.getVal("GC") != w2.getVal("GC")) return false;
            // nb: assuming that they differ in the val of GI at this point
        }
        return true;
    }
};
\end{lstlisting}
\caption{Example diversity pruning strategy}
\label{gest-diversity-strategy}
\end{center}
\end{figure*}

OpenCCG also provides a concrete subclass of \code{Diversity\-Pruning\-Strategy} named \code{Ngram\-Diversity\-Pruning\-Strategy}, which generalizes the approach to pruning described in \cite{Langkilde:2000}. With this class, two signs are considered not compellingly different if they share the same $n\!-\!1$ initial and final words, where $n$ is the n-gram order. When one is interested in single-best output, an n-gram diversity pruning strategy can increase efficiency while guaranteeing no loss in quality---as long as the reduction in the search space outweighs the extra time necessary to check for the same initial and final words---since any words in between an input sign's $n\!-\!1$ initial and final ones cannot affect the n-gram score of a new sign formed from the input sign. However, when N-best outputs are desired, or when repetition scoring is employed, it is less clear whether it makes sense to use an n-gram diversity pruning strategy; for this reason, a simple N-best strategy remains the default option.

\section{Disjunctive logical forms}
\label{sec:disj-lf}

In applications, to specify the desired space of possible paraphrases, one may either provide an input logical form that underspecifies certain realization choices, or include explicit disjunctions in the input LF (or both). In our experience, we have found disjunctive LFs---inspired by those found in \cite{Shemtov:PhD}---to be an important capability, especially as one seeks to make grammars reusable across applications.
\begin{figure}%[t]%[!h]
\begin{small}
\begin{center}
\includegraphics[width=0.52\textwidth]{ex1a}
\end{center}
\begin{itemize}
\item[(a)] Semantic dependency graph for \textit{The design (is$\mid$'s) based on the Funny Day collection by Villeroy and Boch.}
\end{itemize}
\vspace{3mm}
\begin{center}
\includegraphics[width=0.52\textwidth]{ex1b}
\end{center}
\begin{itemize}
\item[(b)] Semantic dependency graph for \textit{The design (is$\mid$'s) based on Villeroy and Boch's Funny Day series.}
\end{itemize}
\vspace{3mm}
\begin{center}
\includegraphics[width=0.52\textwidth]{ex1c}
\end{center}
\begin{itemize}
\item[(c)] Disjunctive semantic dependency graph covering (a)-(b), i.e.\ \textit{The design (is$\mid$'s) based on (the Funny Day (collection$\mid$series) by Villeroy and Boch $\mid$ Villeroy and Boch's Funny Day (collection$\mid$series)).}
\end{itemize}
\end{small}
\caption{Example semantic dependency graphs.}
\label{fig:ex1}
\end{figure}

\begin{figure}%[t]%[!h]
\begin{small}
\ensuremath{
@_{e}(\C{be} \wedge \modp{tense}\con{pres} \wedge \modp{mood}\con{dcl} \wedge \\
\mytab{@_{e}(} \modp{Arg}(d \wedge \C{design} \wedge \modp{det}\con{the} \wedge \modp{num}\con{sg}) \wedge \\
\mytab{@_{e}(} \modp{Prop}(p \wedge \C{based-on} \wedge \\
\mytab{@_{e}(\modp{Prop}(} \modp{Artifact}d \wedge \\
\mytab{@_{e}(\modp{Prop}(} \modp{Source}(c \wedge \C{collection} \wedge \modp{det}\con{the} \wedge \modp{num}\con{sg} \wedge \\
\mytab{@_{e}(\modp{Prop}(\modp{Source}(} \modp{HasProp}(f \wedge \C{Funny\_Day}) \wedge \\
\mytab{@_{e}(\modp{Prop}(\modp{Source}(} \modp{Creator}(v \wedge \C{V\&B}))))
}
\begin{center}
(a)
\vspace{2mm}
\mbox{}\vdots
\vspace{2mm}
\end{center}
\ensuremath{
@_{e}(\C{be} \wedge \modp{tense}\con{pres} \wedge \modp{mood}\con{dcl} \wedge \\
\mytab{@_{e}(} \modp{Arg}(d \wedge \C{design} \wedge \modp{det}\con{the} \wedge \modp{num}\con{sg}) \wedge \\
\mytab{@_{e}(} \modp{Prop}(p \wedge \C{based-on} \wedge \\
\mytab{@_{e}(\modp{Prop}(} \modp{Artifact}d \wedge \\
\mytab{@_{e}(\modp{Prop}(} \modp{Source}(c \wedge \modp{num}\con{sg} \wedge (\modp{det}\con{the})? \wedge \\
\mytab{@_{e}(\modp{Prop}(\modp{Source}(} (\C{collection} \xor \C{series}) \wedge \\
\mytab{@_{e}(\modp{Prop}(\modp{Source}(} \modp{HasProp}(f \wedge \C{Funny\_Day}) \wedge \\
\mytab{@_{e}(\modp{Prop}(\modp{Source}(} (\modp{Creator}\shared{v} \xor \modp{GenOwner}\shared{v})))) \\
\wedge @_{v}(\C{Villeroy\_and\_Boch})
}
\begin{center}
(c)
\end{center}
\end{small}
\caption{HLDS for examples in \figref{ex1}.}
\label{fig:ex1-hlds}
\end{figure}

As an illustration of disjunctive logical forms, consider the semantic dependency graphs in \figref{ex1}, which are taken from the COMIC\footnote{\texttt{http://www.hcrc.ed.ac.uk/comic/}} multimodal dialogue system.\footnote{To simplify the exposition, the features specifying information structure and deictic gestures have been omitted, as have the semantic sorts of the discourse referents.} Given the lexical categories in the COMIC grammar, the graphs in \figref{ex1}(a) and (b) fully specify their respective realizations, with the exception of the choice of the full or contracted form of the copula.\footnote{Note that to be consistent with the distributed grammar, the predicate $\C{based\_on}$ should actually be $\C{based-on}$; this discrepancy has been corrected in the subsequent figures.} To generalize over these alternatives, the disjunctive graph in (c) may be employed.
This graph allows a free choice between the domain synonyms \textit{collection} and \textit{series}, as indicated by the vertical bar between their respective predications. The graph also allows a free choice between the \modp{Creator} and \modp{GenOwner} relations---lexicalized via \textit{by} and the possessive, respectively---connecting the head $c$ (\textit{collection} or \textit{series}) with the dependent $v$ (for \textit{Villeroy and Boch}); this choice is indicated by an arc between the two dependency relations.\footnote{Note that the arc and vertical bar are just presentation devices; there is no difference in the underlying implementation.} Finally, the determiner feature (\modp{det}\con{the}) on $c$ is indicated as optional, via the question mark.\footnote{Another option would be to include the determiner feature in the alternative with the \modp{Creator} relation, but that would make the graph harder to draw and would not illustrate optionality.}

It is worth pausing at this point to observe that in designing the COMIC grammar, the differences between (a) and (b) could perhaps have been collapsed. However, such a move would make it more difficult to reuse the grammar in other applications---and indeed, the core of the grammar is shared with the FLIGHTS system \cite{FLIGHTS-FLAIRS:2004}---as it would presuppose that these paraphrases should always be available in the same contexts. An example where the disjunctively specified paraphrases have more clearly limited contexts of applicability appears in \eref{ex2}:

\begin{exe}
\ex \label{ex:ex2}
(This design $\mid$ This one $\mid$ This) (is$\mid$'s) (classic $\mid$ in the classic style) $\mid$ Here we have a (classic design $\mid$ design in the classic style).
\end{exe}

\noindent
This example shows some of the phrasings that may be used in COMIC to describe the style of a design that has not been discussed previously. The example includes a top-level disjunction between the use of a deictic NP \textit{this design $\mid$ this one $\mid$ this} (with an accompanying pointing gesture) followed by the copula, and the use of the phrase \textit{here we have} to introduce the design. While these alternatives can function as paraphrases in this context, it is difficult to see how one might specify them in a single underspecified (and application-neutral) logical form.

Graphs such as those in \figref{ex1} are represented internally using Hybrid Logic Dependency Semantics (HLDS), as in \figref{ex1-hlds}. In HLDS, as can be seen in \figref{ex1-hlds}(a), each semantic head is associated with a nominal that identifies its discourse referent, and heads are connected to their dependents via dependency relations, which are modeled as modal relations; modal relations are also used to represent semantic features (in which case the relation is to an anonymous node). In (c), two new operators are introduced to represent periphrastic alternatives and optional parts of the meaning, namely $\xor$ and $(\cdot)?$, for exclusive-or and optionality, respectively. To indicate that a nominal represents a reference to a node that is considered a shared part of multiple alternatives, the nominal is annotated with a box, as exemplified by \shared{v}. This notion of shared references is needed during the logical form flattening stage of the realization algorithm in order to determine which elementary predications are part of each alternative.
\begin{figure}%[t]%[!h]
\begin{footnotesize}
\begin{verbatim}
\end{verbatim}
\end{footnotesize}
\caption{XML for example (a) in \figref{ex1}.}
\label{fig:ex1-xml-a}
\end{figure}

\begin{figure}%[t]%[!h]
\begin{footnotesize}
\begin{verbatim}
\end{verbatim}
\end{footnotesize}
\caption{XML for example (c) in \figref{ex1}.}
\label{fig:ex1-xml-c}
\end{figure}

To specify inputs to the realizer, an XML representation of HLDS terms may be employed; alternatively, the more intuitive XML graph representation illustrated in \figref{ex1-xml-a} and \figref{ex1-xml-c} may be used, with an automatic translation converting such representations to HLDS. As can be seen in \figref{ex1-xml-a}, the nodes and dependency relations in the graph are represented by \texttt{node} and \texttt{rel} elements. Note that \texttt{node} elements that represent subordinated, reentrant references to a node use an \texttt{idref} attribute, as exemplified by the \texttt{Artifact} relation to the \texttt{node} element with \texttt{idref="d"}. \figref{ex1-xml-c} shows how periphrastic alternatives and optional parts of the meaning are specified using the \texttt{one-of} and \texttt{opt} elements, respectively. Where the alternatives involve attributes of a node, an \texttt{atts} element is used to provide the lexical predications or semantic features in question. Finally, note that \texttt{node} elements that represent references to a node that is considered a shared part of multiple alternatives are marked with the \texttt{shared="true"} attribute, as is the case here with the references to the dependent node $v$ (for \textit{Villeroy and Boch}).

%% =====================================================================
%% BIBLIOGRAPHY
%% =====================================================================
\addcontentsline{toc}{section}{References}
\bibliographystyle{alpha}
\bibliography{refs}

\end{document}

================================================ FILE: docs/realizer/openccg.sty ================================================

%%
%% This style file contains a minimal set of commands for
%% OpenCCG categories and logical forms, plus derivations.
%% It borrows from earlier style files by Gann, Jason and Geert-Jan,
%% and from Beryl and Mark for the derivations.
%%

\newcommand{\bs}{\backslash}   % backslash, to save typing

\newcommand{\gf}[1]{\textsf{\textsl{#1}}}           % gloss font, for words
\newcommand{\cf}[1]{\ensuremath{\mathsf{#1}}}       % category font
\newcommand{\fb}[1]{\ensuremath{_{\mathit{#1}}}}    % features, subscripted
\newcommand{\fsb}[2]{\ensuremath{_{\langle#1\rangle\mathit{#2}}}}  % fs index and features, subscripted
\newcommand{\C}[1]{\textbf{#1}}                     % concept font
\newcommand{\con}[1]{\ensuremath{\mathrm{#1}}}      % constant font, for sem feature values or sem sorts
\newcommand{\modp}[1]{\ensuremath{\langle}\textsc{#1}\ensuremath{\rangle}}  % sem relation/feature

% CCG derivations
% arguments: #1 = no. of words, #2 = body
% Carsten suggests removing @{}, in order to eliminate a gap on the
% left end of lines in the derivation
\newcommand{\deriv}[2]
{
  \renewcommand{\arraystretch}{.5}
  $\begin{array}[t]{*{#1}{c}}
  #2
  \end{array}$
}

% centered multicolumn (NB: changed \mc to \cmc to avoid conflict with kluwer.cls)
\newcommand{\cmc}[2]{\multicolumn{#1}{c}{#2}}

% Rules, argument #1 gives the number of columns to cover.
\newcommand{\uline}[1]      {\cmc{#1}{\hrulefill} }
\newcommand{\fapply}[1]     { \cmc{#1}{\hrulefill_{>}} }
\newcommand{\bapply}[1]     { \cmc{#1}{\hrulefill_{<}} }
\newcommand{\fcomp}[1]      { \cmc{#1}{\hrulefill_{{>}\mathbf{B}}}}
\newcommand{\fxcomp}[1]     { \cmc{#1}{\hrulefill_{{>}\mathbf{B}_{\times}}}}
\newcommand{\fxcompN}[2]    { \cmc{#1}{\hrulefill_{{>}\mathbf{B}^{#2}_{\times}}}}
\newcommand{\fcomptwo}[1]   { \cmc{#1}{\hrulefill_{{>}\mathbf{B}^2}}}
\newcommand{\fxcomptwo}[1]  { \cmc{#1}{\hrulefill_{{>}\mathbf{B}_{\times}^2}}}
\newcommand{\fcompthree}[1] { \cmc{#1}{\hrulefill_{{>}\mathbf{B}^3}}}
\newcommand{\fxcompthree}[1] { \cmc{#1}{\hrulefill_{{>}\mathbf{B}_{\times}^3}}}
\newcommand{\bcomp}[1]      { \cmc{#1}{\hrulefill_{{<}\mathbf{B}}}}
\newcommand{\bxcomp}[1]     { \cmc{#1}{\hrulefill_{{<}\mathbf{B}_{\times}}}}
\newcommand{\bxcompN}[2]    { \cmc{#1}{\hrulefill_{{<}\mathbf{B}^{#2}_{\times}}}}
\newcommand{\bcomptwo}[1]   { \cmc{#1}{\hrulefill_{{<}\mathbf{B}^2}}}
\newcommand{\bxcomptwo}[1]  { \cmc{#1}{\hrulefill_{{<}\mathbf{B}_{\times}^2}}}
\newcommand{\bcompthree}[1] { \cmc{#1}{\hrulefill_{{<}\mathbf{B}^3}}}
\newcommand{\bxcompthree}[1] { \cmc{#1}{\hrulefill_{{<}\mathbf{B}_{\times}^3}}}
\newcommand{\fsubst}[1]     { \cmc{#1}{\hrulefill_{{>}\mathbf{S}}}}
\newcommand{\bsubst}[1]     { \cmc{#1}{\hrulefill_{{<}\mathbf{S}}}}
\newcommand{\fxsubst}[1]    { \cmc{#1}{\hrulefill_{{>}\mathbf{S}_{\times}}}}
\newcommand{\bxsubst}[1]    { \cmc{#1}{\hrulefill_{{<}\mathbf{S}_{\times}}}}
\newcommand{\ftype}[1]      { \cmc{#1}{\hrulefill_{{>}\mathbf{T}}}}
\newcommand{\btype}[1]      { \cmc{#1}{\hrulefill_{{<}\mathbf{T}}}}
\newcommand{\conj}[1]       { \cmc{#1}{\hrulefill_{{<}\Phi{>}}}}
\newcommand{\boundary}[1]   { \cmc{#1}{\hrulefill_{{<}\mathbf{\%}}}}
\newcommand{\asterisk}[1]   { \cmc{#1}{\hrulefill_{\mathbf{*}}}}
\newcommand{\comb}[2]       % an arbitrary combinator
  { \cmc{#1}{\hrulefill_{#2}}}
\newcommand{\badcomb}[2]    % an inappropriate use of a combinator
  { \cmc{#1}{\hrulefill_{\mbox{ *** }}\hrulefill_{#2}}}
\newcommand{\dcomp}[2]      % an arbitrary dcomposition
  { \cmc{#1}{\dotfill_{#2}}}
\newcommand{\unfreeze}[1]   {\cmc{#1}{\hrulefill_{\mathbf{@}}} }

\newcommand{\ul}{\uline{1}}

\newcounter{CCG@counter}
\newcommand{\CCG@amp}{&}
\newcommand{\ulines}[1]{
  \uline{1}
  \setcounter{CCG@counter}{1}
  \whiledo{\value{CCG@counter} < #1}
  {
    \CCG@amp \uline{1}
    \stepcounter{CCG@counter}
  }
}

================================================ FILE: docs/realizer/refs.bib ================================================

@PhdThesis{Baldridge:PhD,
  author = {Jason Baldridge},
  title = {Lexically Specified Derivational Control in Combinatory Categorial Grammar},
  school = {School of Informatics, University of Edinburgh},
  year = 2002
}

@InProceedings{Baldridge/Kruijff:2002,
  author = {Baldridge, Jason and Kruijff, Geert-Jan},
  title = "{Coupling {CCG} and Hybrid Logic Dependency Semantics}",
  booktitle = {Proc.\ ACL-02},
  year = 2002
}
% booktitle = {Proc.\ of 40th Annual Meeting of the Association for Computational Linguistics},
% pages = {319--326},
% address = {Philadelphia, Pennsylvania},

@InProceedings{Baldridge/Kruijff:2003,
  author = {Baldridge, Jason and Kruijff, Geert-Jan},
  title = "{Multi-Modal Combinatory Categorial Grammar}",
  booktitle = {Proc.\ ACL-03},
  year = 2003
}
% booktitle = {Proc.\ of 10th Annual Meeting of the European Association for Computational Linguistics},
% address = {Budapest, Hungary}

@phdthesis{Kruijff:PhD,
  author={Kruijff, Geert-Jan M.},
  title={A Categorial Modal Architecture of Informativity: Dependency Grammar Logic \& Information Structure},
  school={Charles University},
year=2001 } @InProceedings{Carroll-and-co:1999, author = {John Carroll and Ann Copestake and Dan Flickinger and Victor Pozna\'nski}, title = {An efficient chart generator for (semi-) lexicalist grammars}, booktitle = {Proc.\ EWNLG-99}, year = 1999 } % booktitle = {Proc.\ of the 7th European Workshop on Natural Language Generation}, % Toulouse, France. % pages = {86-95} @InProceedings{Kay:1996, author = {Martin Kay}, title = {Chart generation}, booktitle = {Proc.\ ACL-96}, year = 1996 } % booktitle = {Proc.\ of the 34th Annual Meeting of the Association for Computational Linguistics}, % pages = {200-204} % Santa Cruz, California. @InProceedings{Shieber:1988, author = {Stuart Shieber}, year = 1988, title = {A uniform architecture for parsing and generation}, booktitle = {Proc.\ COLING-88} } % booktitle = {Proc.\ of the 14th International Conference on Computational Linguistics}, % pages = {614-619} % Budapest, Hungary. @InProceedings{Bob-Moore:2002, author = {Robert C. Moore}, title = {A Complete, Efficient Sentence-Realization Algorithm for Unification Grammar}, year = 2002, booktitle = {Proc.\ INLG-02} } % booktitle = {Proc.\ of the 2nd International Natural Language Generation Conference} %pages? %New York @InProceedings{Knight/Hatzi:1995, author = {Kevin Knight and Vasileios Hatzivassiloglou}, year = 1995, title = {Two-level, many-paths generation}, booktitle = {Proc.\ ACL-95} } %I. Langkilde and K. Knight. 1998a. Generation that %exploits corpus-based statistical knowledge. In Proc. %COLING-ACL. @InProceedings{Langkilde/Knight:1998, author = {Irene Langkilde and Kevin Knight}, title = {The practical value of n-grams in generation}, booktitle = {Proc.\ INLG-98}, year = 1998 } % booktitle = {Proc.\ of the Ninth International Workshop on Natural Language Generation}, @InProceedings{Langkilde:2000, author = {Irene Langkilde}, year = 2000, title = {Forest-based statistical sentence generation}, booktitle = {Proc.\ NAACL-00} } @InProceedings{Langkilde-Geary:2002, author = {Irene Langkilde-Geary}, title = {An Empirical Verification of Coverage and Correctness for a General-Purpose Sentence Generator}, year = 2002, booktitle = {Proc.\ INLG-02} } % booktitle = {Proc.\ of the Second International Natural Language Generation Conference} %pages? %New York @InProceedings{Srini/Owen:2000, author = {Srinivas Bangalore and Owen Rambow}, title = {Exploiting a Probabilistic Hierarchical Model for Generation}, year = 2000, booktitle = {Proc.\ COLING-00} } % Saarbrucken, Germany, August 2000. @InProceedings{Varges/Mellish:2001, author = {Sebastian Varges and Chris Mellish}, year = 2001, title = {Instance-based Natural Language Generation}, booktitle = {Proc.\ NAACL-01} } % booktitle = {Proc.\ of the 2nd Meeting of the North American Chapter of the Association for Computational Linguistics}, % pages = {1--8} % (NAACL-2001) % Carnegie Mellon University, Pittsburgh, PA, USA. 
@Article{Steedman-LI:2000, author = {Mark Steedman}, year = 2000, title = "Information Structure and the Syntax-Phonology Interface", journal = "Linguistic Inquiry", volume = 31, number = 4, pages = {649--689} } @Book{Steedman:SynProc, author = {Mark Steedman}, title = {The Syntactic Process}, publisher = {MIT Press}, year = 2000, } % address="Cambridge Mass.", @InProceedings{White/Baldridge:2003, author = {Michael White and Jason Baldridge}, year = 2003, title = "{Adapting Chart Realization to {CCG}}", booktitle = {Proc.\ EWNLG-03} } % booktitle = {Proc.\ of the 9th European Workshop on Natural Language Generation} @Article{White-RLAC:2004, author = {Michael White}, year = 2004, title = "{Efficient Realization of Coordinate Structures in Combinatory Categorial Grammar}", journal = {Research on Language and Computation}, note = {To appear} } @InProceedings{White-INLG:2004, author = {Michael White}, year = 2004, title = "{Reining in CCG Chart Realization}", booktitle = {Proc.\ INLG-04} } @InProceedings{White-ACLSoft:2005, author = {Michael White}, year = 2005, title = "Designing an Extensible {API} for Integrating Language Modeling and Realization", booktitle = {Proc.\ ACL-05 Workshop on Software} } @InCollection{Kruijff:2003, author = {Geert-Jan M. Kruijff}, title = {Binding Across Boundaries}, booktitle = {Resource-Sensitivity in Binding and Anaphora}, editor = {Geert-Jan M. Kruijff and Richard T. Oehrle}, publisher = {Kluwer Academic Publishers}, year = 2003 } @PhdThesis{Shemtov:PhD, year=1997, author={Hadar Shemtov}, title={Ambiguity Management in Natural Language Generation}, school={Stanford University} } @TechReport{Bleu:2001, author = {Kishore Papineni and Salim Roukos and Todd Ward and Wei-Jing Zhu}, year = 2001, title = "{Bleu: a Method for Automatic Evaluation of Machine Translation}", institution = {IBM}, number = {RC22176} } @InProceedings{FLIGHTS-FLAIRS:2004, author = {Johanna Moore and Mary Ellen Foster and Oliver Lemon and Michael White}, title = "Generating Tailored, Comparative Descriptions in Spoken Dialogue", booktitle = {Proc.\ FLAIRS-04}, year = {2004} } @inproceedings{COMIC-eChallenges:2003, title = {Towards Ambient Intelligence: Multimodal Computers that Understand our Intentions}, author = {Els den Os and Lou Boves}, booktitle = {Proc.\ eChallenges-03}, year = {2003} } @InProceedings{SRILM-ICSLP:2002, author = {Andreas Stolcke}, title = "{SRILM} --- {A}n extensible language modeling toolkit", booktitle = {Proc.\ ICSLP-02}, year = 2002} @TechReport{Ristad:1995, author = {Eric S.\ Ristad}, year = 1995, title = "{A Natural Law of Succession}", institution = {Princeton Univ.}, number = {CS-TR-495-95} } @InProceedings{Bilmes-Kirchoff:2003, author = {Jeff Bilmes and Katrin Kirchhoff}, title = "Factored language models and general parallelized backoff", booktitle = {Proc.\ HLT-03}, year = 2003} @Misc{FLM-JHSW:2002, author = {Katrin Kirchhoff and Jeff Bilmes and Sourin Das and Nicolae Duta and Melissa Egan and Gang Ji and Feng He and John Henderson and Daben Liu and Mohamed Noamany and Pat Schone and Richard Schwartz and Dimitra Vergyri}, title = "{Novel Approaches to Arabic Speech Recognition: Report from the 2002 Johns-Hopkins Summer Workshop}", year = 2002} @Article{Daelemans:1999, author = {Walter Daelemans}, title = "Introduction to the special issue on memory-based language processing", journal = {Journal of Experimental \& Theoretical Artificial Intelligence}, volume = 11, number = 3, year = 1999, pages = {287--296} } @InProceedings{Shaw/Hatzi:1999, author = {James 
Shaw and Vasileios Hatzivassiloglou}, title = "Ordering Among Premodifiers", booktitle = {Proc.\ ACL-99}, year = 1999} % Proc. of the 37th Association for Computational Linguistics, pages 135-143, College Park, Maryland, June 1999 @InProceedings{Malouf:2000, author = {Robert Malouf}, title = "The order of prenominal adjectives in natural language generation", booktitle = {Proc.\ ACL-00}, year = 2000} % Proceedings of the 38th Annual Meeting of the Association for Computational Linguistics. Pages 85-92. @Article{Adwait:2002, author = {Adwait Ratnaparkhi}, title = "Trainable approaches to surface natural language generation and their application to conversational dialog systems", journal = {Computer, Speech \& Language}, volume = 16, number = {3/4}, year = 2002, pages = {435--455} } @Article{Oh/Rudnicky:2002, author = {Alice H. Oh and Alexander I. Rudnicky}, title = "Stochastic natural language generation for spoken dialog systems", journal = {Computer, Speech \& Language}, volume = 16, number = {3/4}, year = 2002, pages = {387--407} } @InProceedings{Carsten-Alignment:2005, author = {Carsten Brockmann and Amy Isard and Jon Oberlander and Michael White}, title = "Variable alignment in affective dialogue", booktitle = {Proc.\ UM-05 Workshop on Affective Dialogue Systems}, year = 2005} @Unpublished{COMIC-D7.4:2004, author = {Michael White}, title = "Experiments with Multimodal Output in Human-Machine Interaction", note = {IST Project COMIC Public Deliverable 7.4}, year = 2004} %\texttt{http://www.hcrc.ed.ac.uk/comic/documents/deliverables/D7.4-final.pdf} @InProceedings{Foster-White-NLPXML:2004, author = {Mary Ellen Foster and Michael White}, title = "{Techniques for Text Planning with XSLT}", booktitle = {Proc.\ 4th NLPXML Workshop}, year = 2004} ================================================ FILE: docs/style.css ================================================ body{ font-family: Arial, Helvetica, sans-serif; size: 12pt; background: white; color: black; } h1{ font-family: Verdana, Arial, Helvetica, sans-serif; font-size: 18pt; color: #006699; font-weight: italic; text-align: center; } h2{ font-family: Verdana, Arial, Helvetica, sans-serif; font-size: 16pt; font-weight: bold; color: #006699; } h3{ font-family: Verdana, Arial, Helvetica, sans-serif; font-size: 10pt; color: #006699; text-align: right; } a{ font-family: arial,times; } p{ font-family: Verdana, Arial, Helvetica, sans-serif; color: #000000; font-size: 12pt; } table{ border: 0; margin: 0; } td{ font-family: Bookman,Lucida, Helvetica,arial, times; font-size: 12pt; } td.header1{ font-family: Bookman,Lucida, Helvetica,arial, times; font-size: 12pt; background: #52A0EF; } td.banner{ font-family: Bookman,Lucida, Helvetica,arial, times; font-size: 12pt; background: white; } td.header2{ font-family: Bookman,Lucida, Helvetica,arial, times; font-size: 12pt; background: #52A0EF; } ================================================ FILE: docs/taggers-README ================================================ The OpenCCG POS- and supertaggers can be used off-the-shelf, as well as with the OpenCCG parser. This README describes how to train and use the taggers off-the-shelf; for their use with the OpenCCG parser, see ccgbank-README. The training process has been implemented in an ant build file, so it's a bit easier now. Before you get started, you'll need to configure your environment variables as described in the main README (ie, $OPENCCG_HOME/README). After that, you'll need to install SRILM and Zhang Le's maxent toolkit, as described below. 
Note that this should be relatively straightforward on Linux, but potentially difficult on other platforms.

Once you've taken care of these prerequisites, cd into $OPENCCG_HOME/ccgbank, and then you can train the POS- and supertaggers as follows:

  $ cd $OPENCCG_HOME/ccgbank
  $ ccg-build -f build-original.xml &> logs/log.original &

Note that ccg-build is simply a front-end to ant that sets some environment variables, so you can pass through ant flags such as -f, which indicates that the build file to use is build-original.xml (rather than the default, build.xml).

The training will take a while; you can check the progress by peeking at the log file (logs/log.original), as well as the log files for individual steps in the process, which you can see by looking in the build-original.xml file.

Once training is done, you can try it out as follows:

  $ ccg-build -f build-original.xml test &> logs/log.original.test &

This task will test the POS- and supertaggers on the dev section, and should only take a matter of minutes. Note that you will likely have to increase the Java memory limit, if you haven't already done so; this can be done by choosing a higher value for JAVA_MEM at the end of the script $OPENCCG_HOME/bin/ccg-env, which is invoked by all the other OpenCCG scripts (including ccg-build).

The supertagger output file will be in the following format (with each sentence bracketed by ...):

  [tab][tab]...[tab]...[tab][tab]...[tab]...
  ...
  [tab][tab]...[tab]...[tab][tab]...[tab]...

Adjust the '-beta' option in the build file's test-st-model target to tag at greater tagging ambiguity levels.

Have fun, and do let us know if anything in these instructions is flawed.

-----------------
REQUIRED SOFTWARE
-----------------

To train the models, you'll need to have the SRILM command-line tools (or some in-house stand-in) and Zhang Le's maxent toolkit working. Install SRILM as per the directions, and do the following to install the patched version of Zhang Le's toolkit:

  $ cd
  $ wget http://homepages.inf.ed.ac.uk/lzhang10/software/maxent/maxent-20061005.tar.bz2

Unpack and patch the maxent.cpp file (it doesn't cover the case where ':' can be part of the feature symbol itself, and not just a delimiter that separates string repr's of features from their real-valued activations):

  $ bunzip2 maxent-20061005.tar.bz2
  $ tar xf maxent-20061005.tar
  $ cd maxent-20061005/src
  $ patch maxent.cpp $OPENCCG_HOME/docs/maxent.cpp.patch

Now compile the maxent code:

  $ cd
  $ cd maxent-20061005
  $ make clean all unittest

Test to make sure it (more or less) works (I always only pass 7 of the 8 tests, but the training seems to work):

  $ cd test
  $ ./runall.py

Finally, add the 'maxent' binary (under 'maxent-20061005/src/opt') to your PATH environment variable.

Good. Now we're ready to train some taggers!

----------------
NOTES
------------------------

All the taggers in OpenCCG perform forward-backward tagging. To simplify the implementation (and to take advantage of arbitrarily long n-gram histories of tags) we take a hybrid approach, simply multiplying the non-sequence-aware maxent tagging model with a SRILM-trained (i.e., ARPA-formatted) model of tag sequences. This was the alternative to the orthodox MEMM (Maximum Entropy Markov Model) approach suggested in (McCallum, et al., 2000, section 2.6). Otherwise, the approach closely follows that of Curran, Clark and Vadas (2006), including the use of beta-best POS tags as features.

The POS- and supertaggers can make use of a prior model instead of a tag dictionary.
The idea is to train a prior model to give probabilistic features to a downstream maxent model and let it sort it out, rather than using tagging dictionaries (which use crude frequency cut-offs to determine which tags a word may be assigned). Unfortunately, empirical testing of this idea has been inconclusive, so it's been put on the back burner (by default, a prior model is used with the POS tagger but not the supertagger); it remains for future work to better test the idea, and in particular, whether the prior model feature approach can take better advantage of self-trained data by just re-training the prior model on such data. ================================================ FILE: grammars/add-chunks.xsl ================================================ ================================================ FILE: grammars/add-family-members.xsl ================================================ Warning, no family with name ' ' found for entry with stem ' '. Warning, no entry with name ' ' found in family with name ' ' for entry with stem ' '. ================================================ FILE: grammars/append.xsl ================================================ ================================================ FILE: grammars/categories.xsd ================================================ Elements and types for categories and feature structures. By and large, there are no constraints on the names used in defining categories, with just a few exceptions: - '[*DEFAULT*]' proposition or feature value: this reserved value is replaced with the predicate associated with a lexical item (defaulting to the stem) when instantiating the lexical categories associated with a word - 'index' feature: this feature receives special treatment in the realizer; see Mike and Jason's paper on the realizer for details, at http://www.iccs.informatics.ed.ac.uk/~mwhite/White-Baldridge-ENLG-2003-to-appear.pdf - lists: lists are defined with the 'First' and 'Last' relations, which is (optionally) converted to just the 'List' relation by simplify-lists.xsl; elements in the list are represented using nodes with the 'elem' predicate, together with 'Item' and 'Next' relations to point to the actual list item and the next element, respectively - tuples: pairs (for argument clusters and gapping) are represented using nodes with the 'tup' (for tuple) predicate, together with 'Item1' and 'Item2' relations to point to the paired items (in principle, further 'ItemN' relations could be used for tuples of length greater than 2); paired items receive special treatment in the realizer - 'BoundVar' relation: this relation indicates that the subordinate nominal is a bound var; as a result, feature-based instantiation is disabled in the realizer - 'mark' feature: this semantic attribute indicates that the realizer should label the phrase in the XML output headed by the index associated with this feature A category, either atomic or complex. An atomic category. Atomic categories must have a type, and may contain a feature structure and LF. The possible LF predications are given by the "hldsPreds" type in hlds.xsd. The type of the category, e.g. "np". A complex category, consisting of a target category, an argument stack, and an optional LF. Since a complex cat is not curried, the target category will always be atomic. An argument stack is one or more basic args, dollar args or set args. A simple, non-recursive feature structure, consisting of a set of features, i.e. attribute-value pairs. 
If there is only a single, string-valued feature, it can be specified using the "attr" and "val" attributes on this element. An integer id for the feature structure. The id is used for coindexation, "inheritsFrom" feature propagation, and macro access. This attribute is used to specify feature propagation with exceptions (i.e., default unification). At run time, feature equations are added in order to propagate feature values. In particular, a feature variable is added to this feature structure and a corresponding one is added to the referenced feature structure, for all appropriate attributes except those with explicit values already on this feature structure. The appropriate attributes are determined by the type of the atomic category, and consist of all the attributes seen with this category type in the lexicon file. NB: Attributes appearing in macros in the morph file are not included, since their association with category types is not available statically. The name of the single, string-valued feature (when appropriate). The value of the feature. A feature, i.e. an attribute-value pair. Features can be either syntactic or semantic (LF-valued). Syntactic features can be either ground or variable. If ground, they must be string-valued, and specified via the "val" attribute; if variable, the value is a variable named by a "featvar" element. Semantic features can also be either ground or variable; their possible values are given by the "hldsFeatVals" type in hlds.xsd. The name of the feature. The value of the feature, when string-valued. A variable over syntactic feature values. The name of the feature variable. A basic arg pairs a slash and a category. A dollar arg pairs an optional slash and a dollar variable. The slash defaults to the most general slash. A dollar variable in the definition of a complex category, i.e. a variable over any sublist of args in an arg stack. The name of the dollar variable, for coindexation purposes. A set arg, i.e. an unordered set of basic args. A slash in the definition of a complex category. A slash has a direction, a mode and an ability; a variable can also be given for the mode, using the "varmodality" attribute. For discussion, see Jason's dissertation, esp. Ch. 8 on the implementation; the dissertation is downloadable from http://www.iccs.inf.ed.ac.uk/~jmb/dissertation The direction of the slash. The direction can be forward (/), backward (\) or both (|). Defaults to both. The mode of the slash. The possible values are: all (.), application only (*), associative (^), permutative (x), permutative right (x>), permutative left (<x), associative permutative right (>), and associative permutative left (<). Defaults to all. See Jason's dissertation for details. A variable over modalities. The ability of the slash, either inert or active. Defaults to either. This is used to implement antecedent government; see Jason's dissertation for details. 
================================================ FILE: grammars/comic/build.xml ================================================ ================================================ FILE: grammars/comic/dict.xml ================================================ ================================================ FILE: grammars/comic/dict.xsl ================================================ ================================================ FILE: grammars/comic/grammar.xml ================================================ ================================================ FILE: grammars/comic/lexicon-base.xsl ================================================ Creator Source ================================================ FILE: grammars/comic/lexicon.xml ================================================ ================================================ FILE: grammars/comic/morph.xml ================================================ ================================================ FILE: grammars/comic/rules-base.xml ================================================ ================================================ FILE: grammars/comic/rules.xml ================================================ ================================================ FILE: grammars/comic/testbed.xml ================================================ Describing the style. Manufacturer and series. Decorative tiles. Appositive 'with' now uses an elab-rel. Colour scheme. Added pitch accent onto canned text bits. Combining things. The shared argument (the colours) no longer has to be separated out, since the VPing is now an appositive. NB: The relative clause 'that features ...' is now an appositive, and has theme status here; this would be appropriate in the context of the question 'do you have any more designs with blue in the colour scheme?'. Transitions. Further options (in thumbnails). NB: this clause from the sample dialogue gets its own sentence. Questions. Changed pitch accent and phrase to theme, for clarification context. Changed pitch accent and phrase to theme, for clarification context. User tailoring. 
================================================ FILE: grammars/comic/types-extras.xml ================================================ ================================================ FILE: grammars/comic/types.xml ================================================ ================================================ FILE: grammars/convert-lists.xsl ================================================ ================================================ FILE: grammars/convert-to-graph.xsl ================================================ ================================================ FILE: grammars/convert-to-hlds.xsl ================================================ Error: node with id = should be a reference (with idref) ================================================ FILE: grammars/core-en/add-chunks.xsl ================================================ ================================================ FILE: grammars/core-en/add-intonation-info.xsl ================================================ ' ================================================ FILE: grammars/core-en/adj.xsl ================================================ ================================================ FILE: grammars/core-en/adv.xsl ================================================ ================================================ FILE: grammars/core-en/auxv.xsl ================================================ ================================================ FILE: grammars/core-en/cats.xsl ================================================ ================================================ FILE: grammars/core-en/conj.xsl ================================================ ================================================ FILE: grammars/core-en/derive-features.xsl ================================================ rh h s - ================================================ FILE: grammars/core-en/det.xsl ================================================ ================================================ FILE: grammars/core-en/dict.xsl ================================================ ================================================ FILE: grammars/core-en/drop-features.xsl ================================================ ================================================ FILE: grammars/core-en/lexicon.xsl ================================================ ================================================ FILE: grammars/core-en/misc.xsl ================================================ ================================================ FILE: grammars/core-en/np.xsl ================================================ ================================================ FILE: grammars/core-en/pp.xsl ================================================ Poss ================================================ FILE: grammars/core-en/punct.xsl ================================================ ================================================ FILE: grammars/core-en/raise-nodes.xsl ================================================ Arg1 ================================================ FILE: grammars/core-en/templates.xsl ================================================ ================================================ FILE: grammars/core-en/types.xml ================================================ ================================================ FILE: grammars/core-en/unary-rules.xsl ================================================ ================================================ FILE: grammars/core-en/v.xsl ================================================ 
================================================ FILE: grammars/dict.xsd ================================================ Schema for dict file. A dict file is a more refined version of a morph file that groups word forms by their stems (and parts of speech) and lists the mappings to lexical categories. See the grammar build targets in build.xml for how a dict file can be straightforwardly transformed into the morph.xml and lexicon.xml files required by the run-time system. See morph.xsd for more information on the mapping between morph items and lexical categories, and on the macros (a minimal example entry is sketched below). The root element, containing a list of dictionary entries and macros. A dictionary entry includes any number of 'member-of' and 'stem-for' mapping elements, followed by any number of 'word' elements for different word forms. The stem and part of speech (pos) attributes are required. If there is just a single word form, it can be specified using the 'word' attribute, with the stem as the default. The predicate may also be given with the 'pred' attribute, if it differs from the stem. Any macros that apply to all of the entry's word forms may also be listed. See morph.xsd for info on the (semantic) class and coart(iculation) attributes. Specifies a mapping from the entry to a family of lexical categories. The 'family' attribute should provide the name of a category family. The 'pred' attribute may be used to specify a different predicate to use with this family. Specifies a mapping from the entry to a particular entry in a family of lexical categories. The 'family' and 'entry' attributes should provide the names of a category family and entry therein. A specific word form, given by the 'form' attribute. Any macros that are particular to the word form may be listed. Any lexical category families or entries whose mapping should be blocked may also be listed. ================================================ FILE: grammars/extract-morph.xsl ================================================ ================================================ FILE: grammars/flights/build.xml ================================================ ================================================ FILE: grammars/flights/dict.xml ================================================ ================================================ FILE: grammars/flights/dict.xsl ================================================ ================================================ FILE: grammars/flights/flairs.xml ================================================ Student example. To make "on Ryanair" into a predicative adjective, so that it can serve as the propositional complement of the copula, a dummy 'has-rel' head is introduced. Frequent Flyer example. Business Class example. Frequent Flyer variant, with preferred airline second (still a bit awkward). Some extra test cases.
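Returning to the dict.xsd schema described above: the following is a rough, hypothetical entry of the kind that schema licenses. The 'entry', 'member-of' and 'word' element names and the stem/pos/pred/form attributes come from the prose of the schema description, but the root element name, the family name 'IntransV', the macro names, and the assumption that macros are listed in a 'macros' attribute are illustrative guesses rather than a definitive example from a shipped grammar.

  <dictionary>
    <!-- hypothetical verb entry with two inflected forms; names are illustrative only -->
    <entry stem="sleep" pos="V">
      <member-of family="IntransV"/>
      <word form="sleeps" macros="@sg @pres"/>
      <word form="slept" macros="@past"/>
    </entry>
  </dictionary>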
================================================ FILE: grammars/flights/grammar.xml ================================================ ================================================ FILE: grammars/flights/lexicon-base.xsl ================================================ Airline airline ================================================ FILE: grammars/flights/lexicon.xml ================================================ ================================================ FILE: grammars/flights/morph.xml ================================================ ================================================ FILE: grammars/flights/nina107.xml ================================================ skipping to nina107_033 TBD: nina107_040.wav From where? nina107_041.wav And from where? ================================================ FILE: grammars/flights/rules-base.xml ================================================ ================================================ FILE: grammars/flights/rules.xml ================================================ ================================================ FILE: grammars/flights/testbed.xml ================================================ ================================================ FILE: grammars/flights/types-extras.xml ================================================ ================================================ FILE: grammars/flights/types.xml ================================================ ================================================ FILE: grammars/flights/vera.xml ================================================ ================================================ FILE: grammars/grammar.xsd ================================================ Schema for grammar file. A grammar file lists the lexicon, morphology and rules files, and optionally lists the types file and sequences of XSLT transformations to use in loading/saving LFs from/to XML. It may also specify a custom list of features to use with supertag names, a custom tokenizer, and/or list semantic classes to replace words with for language models. The root element. An element with a file attribute specifying a filename. An element with a file attribute specifying a filename for the lexicon file, plus an optional openlex attribute indicating whether lexical category assignments are complete (for openlex false) or incomplete (for openlex true). An element with a file attribute specifying a filename for the rules file. An optional combosfile attribute gives the filename for the list of observed supercat-rule combos. The format of the combos file is one combo per line, where each combo is either a supertag and a rule name, or a pair of supertags and a rule name, separated by single spaces. The optional dynamic-combos flag indicates whether the observed combos should be determined dynamically (using the ones in the combos file as a starting point, if present). By default, dynamic-combos is true if a combos file is given, and false if not. An element which gives the features to use in constructing supertag names. The feature names are given as a space-delimited list in the feats attribute. An element which gives the fully qualified class name for a custom tokenizer, and/or lists semantic classes to replace words with for language models. Specifies a sequence of XSLT transformations. ================================================ FILE: grammars/hlds.xsd ================================================ Elements and types for hybrid logic dependency semantics (HLDS) constructs. 
The subset of hybrid logic terms used in HLDS is defined here. (The Java classes currently support a slightly larger subset.) To support flattening of these terms into elementary predications, the contents of the satisfaction operators and diamond relations (modal ops) are restricted, as described in detail below. Note that where a list of terms is allowed, these are implicitly conjoined; a conjunction operator is inserted upon loading, when necessary. LFs with disjunctive or optionality operators may also be specified. Nominals and variables may be given a type (or sort) listed in the types file, by appending the type to the name after a colon. Propositions whose names appear in the types file are also treated as typed. Typically one or more satisfaction operators, encoding the semantics associated with a category. Exclusive disjunctions (xor) are also allowed. The possible values of an LF feature, i.e., a nominal (atom or variable), proposition, or variable (over HLDS terms). A satisfaction operator, with a nominal and an arg. The nominal can either be a nominal atom, named by the "nom" attribute, or a nominal variable, named by the "nomvar" attribute. The nominal may be optionally marked as "shared" (see nominal def below). The arg optionally begins with a proposition, followed by any number of diamond relations or disjunctive/optionality operators, but must be non-empty. A named proposition. A diamond relation (modal operator), with a mode and an arg. The "mode" attribute names the relation. The arg is either just a proposition or a variable, or a nominal followed optionally by a proposition and any number of nested diamond relations or disjunctive/optionality operators. In the former case, the relation encodes a semantic feature; in the latter case, it encodes a relation to another semantic head. The arg may also be a disjunctive operator containing satops. A conjunction (conj), exclusive disjunction (xor) or optionality (opt) operator. Note that conjunctions are usually left implicit. A nominal term, either an atom or a variable. The "shared" attribute indicates that the nominal term provides a reference to a node that is a shared part of multiple alternatives, rather than being a subordinated or coordinated reference. A nominal atom. A nominal variable. A variable over HLDS terms. A term with a name. A named term with an optional "shared" attribute. ================================================ FILE: grammars/lexicon.xsd ================================================ Schema for lexicon file. The lexicon file contains the definitions of the lexical categories, whose entries are grouped into families (inspired by XTAG tree families). Families may be open or closed. With open families, all words listed in the morph file with the same part of speech are mapped to all entries in the family. With closed families, the members of the family must be explicitly listed. The lexicon may specify that certain features should be treated specially, either for licensing and instantiating semantically null or "marked" categories in the realizer, or for implementing "distributive" behavior. See below for further details. The root element, which includes the list of category families and the declarations of the licensing and distributive attributes. Lists the names of the attributes with "distributive" behavior, i.e. ones where the feature value is supposed to show up on every atomic category. 
Attributes that are distributive in this sense can be used to prevent phrasal combinations across theme/rheme boundaries, following Steedman's '00 LI paper. Distributive attributes receive two kinds of special processing. First, after instantiating a lexical category for a word, if a distributive attribute has a unique value, it is automatically spread to all of the atomic categories, thereby alleviating the need to ensure this happens in the definition of the lexical categories and macros. Second, as a stopgap measure, following rule combinations, the value of any distributive attribute appearing on the result category is propagated to all argument categories, overwriting any values that may already be there. This processing allows categories such as s[eme=phr]$\s[eme=th]$ to be used for boundary tones, where the value of the distributive 'eme' feature is changed on the target 's' category (in the lexicon), but the value of this attribute on the $-matched categories remains unchanged until the special processing kicks in. This stopgap measure would not be necessary if the 'inheritsFrom' and $ capabilities could be combined, which would require a more dynamic treatment of 'inheritsFrom' (i.e. exceptive feature propagation, or default unification). A space-separated list of attribute names. Lists the features to use to license and/or instantiate semantically null or "marked" categories in the realizer, in priority order. Examples of semantically empty categories may include case-marking prepositions or particles, infinitival 'to', or complementizers such as 'that'. Examples of categories which may be considered "marked" include inverting categories for auxiliaries which are used in questions, but not ordinary declaratives. Note that by default, the 'lex' feature is included as one used to license and instantiate semantically empty categories, for all values, in all locations. Thus, if (say) a semantically null, case-marking preposition category has a 'lex' attribute which is instantiated with the stem (via the '[*DEFAULT*]' mechanism), then this category will be activated in the realizer iff any of the categories instantiated for the input logical form have the same value for the 'lex' feature, thereby indicating its relevance. If an alternative specification for the 'lex' feature is listed, the default specification is not included. The name of the licensing feature, i.e. the attribute. The value of the feature. If not specified, all attribute values are treated the same for licensing and instantiation purposes. A list of other values of this feature whose presence may also license categories with this feature value. A flag indicating whether semantically null categories with the licensing feature need to be licensed. Defaults to true. A flag indicating whether initial categories with the licensing feature are marked and need to be licensed. Defaults to false. If set to true, the defaults for the license-empty-cats and instantiate flags change to false, and the default for the location changes to target-only. A flag indicating whether semantically empty categories with the licensing feature should be instantiated. Defaults to true. The location of the licensing feature on the category to be licensed. If target-only, then the value must appear only on the target category. If args-only, then the value must appear only on the argument categories. Defaults to both. Optionally specifies the order in which to sort relations in the logical forms.
The default sort order is as follows, where "*" indicates all other relations (sorted alphabetically): "BoundVar", "PairedWith", "Restr", "Body", "Scope", "*", "GenRel", "Coord", "Append". The default order may be overridden using the 'order' attribute, which should contain a space-separated list of relation names, with "*" indicating all other relations. A space-separated list of relation names. A category family, which groups lexical category entries, and optionally includes a list of the family members, if the family is closed. Family members are listed by their stems. A 'member' element may also have a predicate ('pred') explicitly specified, if it differs from the stem. The predicate is used to fill in any propositions in the semantics with the reserved name '[*DEFAULT*]'. The name of the family must be unique. The part of speech ('pos') is used in the mapping between morphological items and families, as described earlier. A family may also declare a relation used for indexing purposes (the 'indexRel') in the realizer, i.e. a relation used to look up words based on relational or featural elementary predications in the input logical form; see Mike and Jason's paper on the realizer for discussion, at http://www.iccs.informatics.ed.ac.uk/~mwhite/White-Baldridge-ENLG-2003-to-appear.pdf. Families with semantically null entries are indicated using the reserved value '*NoSem*'. Relations may also be declared at the level of entries. NB: It would be nicer if the system could figure out which entries were semantically null; what makes this non-trivial is that macros can introduce additional semantic predications. At present, this is only discovered when lexical categories are instantiated for specific words. As an alternative to the indexRel, a family may declare a relation (semantic feature) to use to signal a coarticulation, via the 'coartRel' attribute. For example, the coart rel "kon" may be used to signal a contrast feature that triggers the addition of a pitch accent. Coarticulations are handled as lexical modifiers, and as such should be given modifier categories of the form X|X. An entry for a family, which contains the definition of a lexical category, and must have a name which is unique within the family. If there is only one stem that is applicable to this entry, it may be specified on this element. A relation to use for indexing purposes in realization may be given for this entry (if different from other entries in the family). It is possible to temporarily disable an entry by setting the 'active' attribute to false (defaults to true).
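As a minimal illustration of the family/entry structure just described (and of the satop/diamond notation from hlds.xsd), here is a hedged sketch of a closed intransitive-verb family. The element names (family, entry, complexcat, atomcat, slash, fs, feat, lf, satop, diamond, prop, nomvar) follow the conventions seen in the shipped grammars, but the family name, feature ids, the 'Arg1' mode and the linking of feature-structure indices to LF nominals are simplified assumptions, not a definitive entry:

  <family name="IntransV" pos="V" closed="true">
    <entry name="Primary">
      <!-- s\np, with the subject required to be nominative; ids and features are illustrative -->
      <complexcat>
        <atomcat type="s">
          <fs id="1"/>
        </atomcat>
        <slash dir="\"/>
        <atomcat type="np">
          <fs id="2">
            <feat attr="case" val="nom"/>
          </fs>
        </atomcat>
      </complexcat>
      <!-- the proposition [*DEFAULT*] is filled in with the member's pred (or stem) -->
      <lf>
        <satop nomvar="E">
          <prop name="[*DEFAULT*]"/>
          <diamond mode="Arg1">
            <nomvar name="X"/>
          </diamond>
        </satop>
      </lf>
    </entry>
    <member stem="sleep"/>
  </family>

With a closed family like this, only morph items whose stem is listed as a member (and whose part of speech matches) are mapped to the entry; an open family would instead pick up every morph item with the matching part of speech, as described under morph.xsd below.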
================================================ FILE: grammars/mini-basque/build.xml ================================================ ================================================ FILE: grammars/mini-basque/dict.xml ================================================ ================================================ FILE: grammars/mini-basque/grammar.xml ================================================ ================================================ FILE: grammars/mini-basque/lexicon-base.xml ================================================ ================================================ FILE: grammars/mini-basque/lexicon.xml ================================================ ================================================ FILE: grammars/mini-basque/morph.xml ================================================ ================================================ FILE: grammars/mini-basque/parameters.xml ================================================ ================================================ FILE: grammars/mini-basque/preset-families.xml ================================================ ================================================ FILE: grammars/mini-basque/rules.xml ================================================ ================================================ FILE: grammars/mini-basque/testbed.out ================================================ Loading grammar from URL: file:/home/bozsahin/openccg/grammars/mini-basque/grammar.xml Parse Realize String ----- ------- ------ ok - joan ok - ikusi ok - zuen ok - zen ok - klase ra ok - eskola n ok - ama aitak ikusi zuen ok - ama joan ok - *ama k joan ok - *ama k joan du (2) - ama k seme a ikusi du (2) - seme a ama k ikusi du (2) - nik liburu a emakume ari eman nahi dut FAILED - *nik liburu a aita k eman nahi dut FAILED - *nik aita k liburu a eman nahi dut ok - ama k seme a emakume ari eman dio ok - seme a ama k emakume ari eman dio ok - emakume ari seme a ama k eman dio ok - nik joan nahi dut (2) - nik kafe a egin nahi dut ok - *nik kafe a egin nahi du ok - nik kafe a egin nahi FAILED - *nik aita k ikusi nahi dut ok - nik ikusi nahi dud an gizon a joan da ok - gizon a ikusi nahi dud an seme a joan da ok - emakume ari liburu a eman dio n gizon a joan du FAILED - emakume ari liburu a eman dio n gizon a nik ikusi dut ok - *emakume ari liburu a eman dio n gizon ak ni ikusi dut ok - emakume ari liburu a eman dio n gizon ak ni ikusi (2) - gizon ak emakume ari eman dio n liburu a aita k ikusi du (3) - gizon ak liburu a eman dio n emakume a ok - gizon ak liburu a eman dio n emakume a joan du (3) - aita k seme a eskola n utzi zuen eta klase ra joan zen (3) - seme a eskola n utzi zuen eta klase ra joan zen (3) - seme a eskola n utzi eta klase ra joan zen ok - *seme a eskola n utzi eta klase ra joan zuen ok - ama joan zen eta aita k ikusi zuen ok - aita k ikusi zuen eta klase ra joan zen ok - *ama k joan eta aita ikusi zuen ok - aitak ama ikusi zuen eta joan zen ok - ama aitak ikusi zuen eta joan zen ok - joan zen eta ama ikusi zuen ok - joan zen eta aitak ikusi zuen FAILED - sagarrak emakume ak egosten ditu eta gizonak jaten ditu ok - sagarrak emakume ak egosten ditu eta usteltzen dira ok - sagarrak usteltzen dira eta emakume ak egosten ditu ================================================ FILE: grammars/mini-basque/testbed.xml ================================================ ================================================ FILE: grammars/mini-basque/types.xml ================================================ 
================================================ FILE: grammars/mini-dyirbal/build.xml ================================================ ================================================ FILE: grammars/mini-dyirbal/dict.xml ================================================ ================================================ FILE: grammars/mini-dyirbal/grammar.xml ================================================ ================================================ FILE: grammars/mini-dyirbal/lexicon-base.xml ================================================ ================================================ FILE: grammars/mini-dyirbal/lexicon.xml ================================================ ================================================ FILE: grammars/mini-dyirbal/morph.xml ================================================ ================================================ FILE: grammars/mini-dyirbal/parameters.xml ================================================ ================================================ FILE: grammars/mini-dyirbal/preset-families.xml ================================================ ================================================ FILE: grammars/mini-dyirbal/rules.xml ================================================ ================================================ FILE: grammars/mini-dyirbal/testbed.out ================================================ Loading grammar from URL: file:/home/bozsahin/openccg/grammars/mini-dyirbal/grammar.xml Parse Realize String ----- ------- ------ ok - bayi yara walngarra nabaygu ok - bayi yara walngarra bural naygu bagun yibi gu ok - bayi yara walngarra bangun yibi ngu burali ok - yabu numa ngu gigan banagaygu ok - naja bayi yara gigan gubi ngu mawali ok - *naja bayi yara gigan bayi gubi mawali ok - bayi yara miyanda nu yanu ok - balan yibi bangul yara ngu miyanda nu ru buran ok - bayi yara jilwal na nu bagun guda gu yanu ok - bayi burrbula bangul gubi ngu baran , bajigu FAILED - *bangul gubi ngu bayi burrbula baran , bajigu ok - bayi yara yanu , bangun yibi ngu buran ok - nyurra nanana buran , banaganyu ================================================ FILE: grammars/mini-dyirbal/testbed.xml ================================================ ================================================ FILE: grammars/mini-dyirbal/types.xml ================================================ ================================================ FILE: grammars/mini-english/build.xml ================================================ ================================================ FILE: grammars/mini-english/dict.xml ================================================ ================================================ FILE: grammars/mini-english/grammar.xml ================================================ ================================================ FILE: grammars/mini-english/lexicon-base.xml ================================================ ================================================ FILE: grammars/mini-english/lexicon.xml ================================================ ================================================ FILE: grammars/mini-english/morph.xml ================================================ ================================================ FILE: grammars/mini-english/parameters.xml ================================================ ================================================ FILE: grammars/mini-english/preset-families.xml ================================================ ================================================ FILE: 
grammars/mini-english/rules.xml ================================================ ================================================ FILE: grammars/mini-english/testbed.out ================================================ Loading grammar from URL: file:/home/bozsahin/openccg/grammars/mini-english/grammar.xml Parse Realize String ----- ------- ------ ok - John promised him to exercise ok - John persuaded him to read the book ok - *John promised him Sue see ok - John gave Mary and read a book ok - the doctor punched the patient and fell-down ================================================ FILE: grammars/mini-english/testbed.xml ================================================ ================================================ FILE: grammars/mini-english/types.xml ================================================ ================================================ FILE: grammars/mini-inuit/build.xml ================================================ ================================================ FILE: grammars/mini-inuit/dict.xml ================================================ ================================================ FILE: grammars/mini-inuit/grammar.xml ================================================ ================================================ FILE: grammars/mini-inuit/lexicon-base.xml ================================================ ================================================ FILE: grammars/mini-inuit/lexicon.xml ================================================ ================================================ FILE: grammars/mini-inuit/morph.xml ================================================ ================================================ FILE: grammars/mini-inuit/parameters.xml ================================================ ================================================ FILE: grammars/mini-inuit/preset-families.xml ================================================ ================================================ FILE: grammars/mini-inuit/rules.xml ================================================ ================================================ FILE: grammars/mini-inuit/testbed.out ================================================ Loading grammar from URL: file:/home/bozsahin/openccg/grammars/mini-inuit/grammar.xml Parse Realize String ----- ------- ------ ok - miiqqat Juuna ikiussallugu niriursuipput ok - miiqqat qitissallutik niriursuipput ok - nanuq Piita p tugu taa ok - miiraq kamat tuq ================================================ FILE: grammars/mini-inuit/testbed.xml ================================================ ================================================ FILE: grammars/mini-inuit/types.xml ================================================ ================================================ FILE: grammars/mini-nezperce/build.xml ================================================ ================================================ FILE: grammars/mini-nezperce/parameters.xml ================================================ ================================================ FILE: grammars/mini-nezperce/preset-families.xml ================================================ ================================================ FILE: grammars/mini-nezperce/types.xml ================================================ ================================================ FILE: grammars/mini-tagalog/build.xml ================================================ ================================================ FILE: grammars/mini-tagalog/dict.xml ================================================ 
================================================ FILE: grammars/mini-tagalog/grammar.xml ================================================ ================================================ FILE: grammars/mini-tagalog/lexicon-base.xml ================================================ ================================================ FILE: grammars/mini-tagalog/lexicon.xml ================================================ ================================================ FILE: grammars/mini-tagalog/morph.xml ================================================ ================================================ FILE: grammars/mini-tagalog/parameters.xml ================================================ ================================================ FILE: grammars/mini-tagalog/preset-families.xml ================================================ ================================================ FILE: grammars/mini-tagalog/rules.xml ================================================ ================================================ FILE: grammars/mini-tagalog/testbed.out ================================================ Loading grammar from URL: file:/home/bozsahin/openccg/grammars/mini-tagalog/grammar.xml Parse Realize String ----- ------- ------ (3) - iniwasan ko ng tumingin kay Lorna ok - nagatubili siya ng humiram ng pera sa bangko ok - nagatubili siya ng hiramin ang pera sa bangko (2) - nagatubili siya ng hiraman ng pera ang bangko ok - binawalan ko si Maria ng awitin ang pera (3) - ang babae ng bumili ng baro (3) - ang baro ng binili ng babae (2) - huhugasan ko at pupunasan mo ang mgapinggan (2) - niluto ang pagkain at hinugasan ang mgapinggan ni Josie (4) - nanghuhuli ang ama at nagtitinda ang ina ng isda (2) - nagbigay ng regalo si Maria at nagpadala ng liham ang mgabat a kay Juan (5) - pumunta sa tindahan at bumili ang kapatid ng bigas ================================================ FILE: grammars/mini-tagalog/testbed.xml ================================================ ================================================ FILE: grammars/mini-tagalog/types.xml ================================================ ================================================ FILE: grammars/mini-turkish/build.xml ================================================ ================================================ FILE: grammars/mini-turkish/dict.xml ================================================ ================================================ FILE: grammars/mini-turkish/grammar.xml ================================================ ================================================ FILE: grammars/mini-turkish/lexicon-base.xml ================================================ ================================================ FILE: grammars/mini-turkish/lexicon.xml ================================================ ================================================ FILE: grammars/mini-turkish/morph.xml ================================================ ================================================ FILE: grammars/mini-turkish/parameters.xml ================================================ ================================================ FILE: grammars/mini-turkish/preset-families.xml ================================================ ================================================ FILE: grammars/mini-turkish/rules.xml ================================================ ================================================ FILE: grammars/mini-turkish/testbed.out ================================================ Loading grammar from URL: 
file:/home/bozsahin/openccg/grammars/mini-turkish/grammar.xml Parse Realize String ----- ------- ------ ok - cocuk kitab i oku ma ya calisti ok - *cocuk kitab i oku ma yi calisti ok - cocuk kitab i oku mak istedi ok - cocuk kitab i oku ma yi istedi ok - *cocuk kitab i oku ma ya istedi ok - *cocuk adam kitab i ver me yi istedi ok - adam cocug u kitab i oku ma ya zorladi ok - *adam cocug u kitab i oku ma yi zorladi ok - cocug u adam kitab i oku ma ya zorladi ok - adam cocug u kitab i kadin a ver me ye zorladi ok - adam cocug u kadin a kitab i ver me ye zorladi ok - cocug u adam kadin a kitab i ver me ye zorladi ok - *adam cocug u kadin kitab i ver me ye zorladi ok - *adam cocug a kadin a kitab i ver me ye zorladi ok - kitab i oku yan adam uyudu ok - cocuk kitab i oku yan adam i gordu ok - adam in gor dugu cocuk uyudu ok - cocuk adam in gor dugu kitab i okudu ok - cocug un kitab i ver digi adam uyudu ok - cocug un adam a ver digi kitap dustu ok - *adam cocug un adam a ver en kadin i gordu ok - *adam adam a kitab i ver digi kadin i gordu ok - adam cocug a carpti ve dustu ok - cocug a adam carpti ve dustu ok - cocug a carpti ve adam dustu ok - kitab i adam cocug a verdi ama kadin almisti ok - cocug a kitab i adam verdi ama kadin almisti ok - dergi ye adam bakti ama cocuk okudu ================================================ FILE: grammars/mini-turkish/testbed.xml ================================================ ================================================ FILE: grammars/mini-turkish/types.xml ================================================ ================================================ FILE: grammars/morph.xsd ================================================ Schema for morph file. A morph file lists all the known word forms (morph items) together with their stems, parts of speech, semantic classes, associated macros, and excluded lexical categories. The part of speech is used to help determine the mapping between morph items and lexical categories. A morph item is automatically associated with all open families with matching parts of speech. With closed families, the morph item's stem must be listed as a family member, and the parts of speech must match. It is also possible to exclude certain lexical category entries or families, by including the entry name, qualified entry name or family name in the morph item's list of excluded lexical categories. NB: A limitation of the current implementation is that the mapping between morph items and open families can only be done with the stem as the predicate; to use different predicates, closed families must be used. Semantic classes may also be given, for n-gram ranking purposes, and for restricting the unification of nominals to compatible types, specified in the types file. When a category is instantiated, the semantic class is assigned to the nominal var(s) for the proposition with the reserved name '[*DEFAULT*]'. The types of all nominal vars are then propagated to all other nominal vars with the same name, throughout the category. The macros are used to add features or semantic predications to a lexical category that depend on the particular morph item (e.g. tense, number, case, etc.). The root element, containing a list of entries (morph items) and macros. Each macro must have a unique name. A morph item, with its word form, stem, part of speech, and optional semantic class, associated macros, and excluded lexical categories. The stem defaults to word form. 
At run time, when the grammar is loaded, a cross-reference check is performed on the names in the lists of associated macros and excluded lexical categories. The coart flag indicates that this entry is a coarticulation, e.g. a pitch accent, gesture, or other word-associated element. With coarticulations, the word form should be one or more attribute-value pairs, with attributes and values separated by hyphens, and multiple pairs separated by colons. When multiple attribute-value pairs are given, only the first one is used for indexing purposes. An identifying value for the stem should also be given, e.g. *accent* for a pitch accent. NB: Lexical attributes supplied by coarticulations must be supplied uniformly; that is, they cannot already appear on some lexical items. Also, when there are multiple, independent coarticulations, they must supply disjoint sets of lexical attributes, and their categories must be capable of applying in any order. A named macro, with a set of features and/or semantic predications to add to a lexical category. The features are given by feature structure declarations, where the id is used to indicate where the features are to be added (i.e., to the feature structure of which atomic category). The semantic predications are given in an 'lf' element; at run time, these HLDS predications are flattened and added to any predications already present in the lexical category. Macro names begin with @ (for historical reasons) and are followed by at least one non-whitespace character. (A minimal entry and macro sketch appears below, after the parameters schema.) ================================================ FILE: grammars/parameters.xsd ================================================ Schema for the parameters.xml file. The parameters file contains definitions of the language type, its basic word order and category for basic intransitive verbs, and the word order skeleton for the basic transitive verbs. iv and tv are pre-CCG categories. They refer to the grammatical roles S, A and P, described by the XML tags s-argument, a-argument and p-argument. They are mapped to CCG categories by parametric-lexicon.xsl. Word order can be specified as an ordered/unordered list of arguments. Curried arguments can be described by enclosing them in an arg tag, and a set of arguments in a setarg tag (the latter is also a valid category in openCCG, cf. categories.xsd and lexicon.xsd, but arg is not). For further information and how to start up lexicon design from a skeletal lexicon, see Bozsahin and Steedman (2003) (draft), and the comments generated in the file preset-families.xml by parametric-lexicon.xsl. As usual, the best way to learn is to look at an example file. Parameter files are provided for Basque, Dyirbal, English, Inuit, Tagalog and Turkish (in their respective directories). p-argument and a-argument must not carry case; they are set from the iv specs. s-argument must carry case; the tv category and its grammatical relations are set up from this case and the language type. The direction of the slash. The direction can be forward (/), backward (\) or both (|). What kind of subject is missing from the infinitive (parameter) The parameters must include infinitival, iv and tv specifications. The latter two must have a predicate specification. iv has s-argument, tv has a-argument and p-argument, wrapped in either arg or setarg tags. They can appear in any order (both iv and tv specs, and argument and predicate specs). The controllee must specify the subject type as semantic or syntactic.
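The morph-file sketch forward-referenced under morph.xsd above: one inflected entry pointing at two macros, one contributing a number feature to the feature structure with id 2 and one adding a tense predication via an lf element. The root element name, stem, macro names, feature ids and attribute names are illustrative assumptions following the prose of the schema description, not copied from a shipped grammar:

  <morph>
    <entry word="sleeps" stem="sleep" pos="V" macros="@sg @pres"/>
    <!-- adds num=sg to the feature structure with id 2 of the instantiated category -->
    <macro name="@sg">
      <fs id="2">
        <feat attr="num" val="sg"/>
      </fs>
    </macro>
    <!-- adds a tense predication; flattened and merged with the category's existing predications -->
    <macro name="@pres">
      <lf>
        <satop nomvar="E">
          <diamond mode="tense">
            <prop name="pres"/>
          </diamond>
        </satop>
      </lf>
    </macro>
  </morph>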
================================================ FILE: grammars/parametric-lexicon.xsl ================================================ NB: Word order and directionality of embedded clause's |(S|NP) type is an 'educated guess' from the syntactic type of TV. Change them accordingly. NB: If infinitive type is syntactic subject (which is the default), there is a built-in type in the types.xml file called "subject-case". Include in this type all the subjects that can be controlled, e.g. nominative subjects only (as in German), dative and nominative subjects (as in Malayalam) etc. In this case, the controllee is not semantically restricted. If infinitive type is semantic subject, you need a larger fragment of Hybrid Logic than HLDS uses to implement identity of two event variables e.g. @_e(Arg1 a) ^ @_e(Arg1 b) --> @_a(b) where a is the event variable for the controller verb, and b is the event variable for the controlled verb, and Arg1 is the modality for primary arguments (1s). This constraint is formulable in HL but HLDS does not cover that fragment (yet). When it does, the lf tag should just stick in that constraint. Currently, OpenCCG can generate an LF with TWO non-identical Arg1 modalities in the same event structure; therefore some illicit examples would go through. NB: Index is same as Arg1's NB: Index is same as Arg1's NB: Word order and directionality of embedded clause's |(S|NP) type is an 'educated guess' from the syntactic type of TV. Change them accordingly. NB: If infinitive type is syntactic subject (which is the default), there is a built-in type in the types.xml file called "subject-case". Include in this type all the subjects that can be controlled, e.g. nominative subjects only (as in German), dative and nominative subjects (as in Malayalam) etc. In this case, the controllee is not semantically restricted. If infinitive type is semantic subject, you need a larger fragment of Hybrid Logic than HLDS uses to implement identity of two event variables e.g. @_e(Arg1 a) ^ @_e(Arg1 b) --> @_a(b) where a is the event variable for the controller verb, and b is the event variable for the controlled verb, and Arg1 is the modality for primary arguments (1s). This constraint is formulable in HL but HLDS does not cover that fragment (yet). When it does, the lf tag should just stick in that constraint. Currently, OpenCCG can generate an LF with TWO non-identical Arg1 modalities in the same event structure; therefore some illicit examples would go through. NB: Index is same as Arg2's NB: Index is same as Arg2's - This file is generated by parametric-lexicon.xsl to set up the accusativity/ergativity parameter for IV and TV primary families and control primary families. NB: pre-CCG categories of parameters.xml are mapped to CCG categories in this file. From now on, it's all CCG. Suggestions for starting up lexicon development: 1) Copy this file to lexicon-base.xml to avoid losing your changes to it (remember, this file is auto-generated at the start) 2) Edit lexicon-base.xml to modify the preset families and to add your own families as needed (merging the entries of the same family is left to you) 3) Use the ccg-build facility of openCCG, which uses lexicon-base to build the lexicon.xml, morph.xml and rules.xml files needed by the system. *** Families derived from language parameters *** Includes primary entries for IV (unerg and unacc), basic TV, TV-control1, TV-control2, IV-control1. subject-case, s-case, p-case and a-case are value types that set up ergative-accusative mapping and surface cases of these arguments (cf.
types.xml file). Actual case values for them (e.g. nom for a-case in accusative languages, erg for a-case in ergative languages) are defined in the types.xml file. You can of course refer to actual values since they are types, but if a construction is related to GR mapping (ERG or ACC), it's better to use `subject-case' (which covers a-case and s-case in ACC; p-case and s-case in ERG). Types.xml sets these up from the parameter specification. *** End of derived families *** Add new families here, and merge the new entries for preset families as needed (e.g., you may add an entry to the TV family for pro-dropping the subject etc.) NB: Argument is the PAS of the embedded S|NP (cf. E2 above) NB: Argument is the PAS of the embedded S|NP (cf. E2 above) NB: Argument is the PAS of the embedded S|NP (cf. E2 above) ================================================ FILE: grammars/parametric-types.xsl ================================================ - This file is generated by parametric-types.xsl from parameter specs (parameters.xml) to set up the types.xml file for development. - If the language in question has e.g. quirky subjects etc., add their values under appropriate types. subject-case, s-case, p-case and a-case are pre-defined types that are used in the automatically generated initial lexicon (preset-families.xml). We recommend that you don't change them. They handle accusative/ergative mapping among other things (cf. types.xml initial hierarchy). Warning: Please substitute case names as children of a-case and p-case since these cannot be predicted parametrically for an unaligned language (cf. unknown and unknown2 values). ================================================ FILE: grammars/raise-nodes.xsl ================================================ Next ================================================ FILE: grammars/routes/build.xml ================================================ ================================================ FILE: grammars/routes/dict.xml ================================================ ================================================ FILE: grammars/routes/dlf_test.xml ================================================ from mid-Cambridge , drive west on Cambridge_Street for about 1 mile . from mid-Cambridge , drive on Cambridge_Street toward Harvard_Yard for a mile . drive west on Cambridge_Street for a mile . drive on Cambridge_Street toward Harvard_Yard for about 1 mile . ================================================ FILE: grammars/routes/grammar.xml ================================================ ================================================ FILE: grammars/routes/lexicon-base.xml ================================================ ================================================ FILE: grammars/routes/lexicon.xml ================================================ ================================================ FILE: grammars/routes/morph.xml ================================================ ================================================ FILE: grammars/routes/rules.xml ================================================ ================================================ FILE: grammars/routes/testbed.xml ================================================ ================================================ FILE: grammars/routes/types.xml ================================================ ================================================ FILE: grammars/rules.xsd ================================================ Schema for combinatory rules file. A rules file specifies the combinatory rules to use.
These rules include the (potentially) universal set of application, composition, type raising and substitution rules; they are only "potentially" universal because for efficiency one might want to use a restricted subset of the rules, and because the type raising rules are defined to work with specific, configurable argument and result types. The rules file may also specify unary type changing rules, which may be thought of as signs for zero morphemes, and thus conceptually belonging to the lexicon rather than to the (potentially) universal rule set. They are defined in the rules file since, algorithmically, they are handled at the same time as the other combinatory rules. The root element. Application, e.g. X/Y Y => X. Composition, e.g. X/Y Y/Z => X/Z. Substitution, e.g. X/Y/Z Y/Z => X/Z. Specifies the direction of the rule. With forward combination, the functor appears on the left; with backward combination, it appears on the right. Specifies whether the rule is harmonic (true) or permutative (false). Type raising, e.g. np => s/(s\np). The default category for the arg is "np"; the default for the result is "s". Specifies whether a coindexed dollar variable is included on the argument and result categories. Unary type changing rule, e.g. np => s/(s/np) for topicalization. The arg and result categories are required, as is the name attribute. ================================================ FILE: grammars/simplify-lists.xsl ================================================ ================================================ FILE: grammars/tiny/build.xml ================================================ ================================================ FILE: grammars/tiny/grammar.xml ================================================ ================================================ FILE: grammars/tiny/lexicon.xml ================================================ ================================================ FILE: grammars/tiny/morph.xml ================================================ ================================================ FILE: grammars/tiny/rules.xml ================================================ ================================================ FILE: grammars/tiny/testbed.xml ================================================ ================================================ FILE: grammars/tiny/types.xml ================================================ ================================================ FILE: grammars/tokens.xsd ================================================ Definitions for tokens. A 'token' as defined here is a string with no white space, for easy parsing, but otherwise more flexible than a NMTOKEN. Feature variables with optional type. ================================================ FILE: grammars/treeify-lists.xsl ================================================ ================================================ FILE: grammars/types.xsd ================================================ Schema for type hierarchy file. A type hierarchy file specifies the hierarchy of simple types which constitute the domain of syntactic feature values. The root element, containing a list of type entries. Each type must have a unique name. A simple type, with its name and immediate parents in the hierarchy. Parents are specified as a space-separated list of type names. Parents attribute is optional and defaults to the built-in type "top". Only the immediate parents should be specified. The whole hierarchy is constructed during the initial grammar loading process. 
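Type-hierarchy files are correspondingly compact. The following is a hedged sketch of the kind of content types.xsd describes, assuming the root element is named 'types'; the case names themselves are illustrative. Only immediate parents are declared, and a type with no parents attribute defaults to the built-in type "top":

  <types>
    <!-- illustrative case hierarchy; only immediate parents are given -->
    <type name="case"/>
    <type name="nom" parents="case"/>
    <type name="acc" parents="case"/>
    <type name="dat" parents="case"/>
  </types>

As noted above, the full hierarchy is assembled from these immediate-parent declarations when the grammar is loaded.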
================================================ FILE: grammars/worldcup/add-chunks.xsl ================================================ ================================================ FILE: grammars/worldcup/build.xml ================================================ ================================================ FILE: grammars/worldcup/dict.xml ================================================ ================================================ FILE: grammars/worldcup/grammar.xml ================================================ ================================================ FILE: grammars/worldcup/lexicon-base.xsl ================================================ ================================================ FILE: grammars/worldcup/lexicon.xml ================================================ ================================================ FILE: grammars/worldcup/morph.xml ================================================ ================================================ FILE: grammars/worldcup/raise-nodes.xsl ================================================ Restr ================================================ FILE: grammars/worldcup/rules.xml ================================================ ================================================ FILE: grammars/worldcup/testbed.xml ================================================ ================================================ FILE: lib/ASL ================================================ /* * ============================================================================ * The Apache Software License, Version 1.1 * ============================================================================ * * Copyright (C) 1999 The Apache Software Foundation. All rights reserved. * * Redistribution and use in source and binary forms, with or without modifica- * tion, are permitted provided that the following conditions are met: * * 1. Redistributions of source code must retain the above copyright notice, * this list of conditions and the following disclaimer. * * 2. Redistributions in binary form must reproduce the above copyright notice, * this list of conditions and the following disclaimer in the documentation * and/or other materials provided with the distribution. * * 3. The end-user documentation included with the redistribution, if any, must * include the following acknowledgment: "This product includes software * developed by the Apache Software Foundation (http://www.apache.org/)." * Alternately, this acknowledgment may appear in the software itself, if * and wherever such third-party acknowledgments normally appear. * * 4. The names "Ant" and "Apache Software Foundation" must not be used to * endorse or promote products derived from this software without prior * written permission. For written permission, please contact * apache@apache.org. * * 5. Products derived from this software may not be called "Apache", nor may * "Apache" appear in their name, without prior written permission of the * Apache Software Foundation. * * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED WARRANTIES, * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND * FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 
IN NO EVENT SHALL THE * APACHE SOFTWARE FOUNDATION OR ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLU- * DING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS * OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON * ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. * * This software consists of voluntary contributions made by many individuals * on behalf of the Apache Software Foundation. For more information on the * Apache Software Foundation, please see . * */ ================================================ FILE: lib/LGPL ================================================ GNU LESSER GENERAL PUBLIC LICENSE Version 2.1, February 1999 Copyright (C) 1991, 1999 Free Software Foundation, Inc. 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA Everyone is permitted to copy and distribute verbatim copies of this license document, but changing it is not allowed. [This is the first released version of the Lesser GPL. It also counts as the successor of the GNU Library Public License, version 2, hence the version number 2.1.] Preamble The licenses for most software are designed to take away your freedom to share and change it. By contrast, the GNU General Public Licenses are intended to guarantee your freedom to share and change free software--to make sure the software is free for all its users. This license, the Lesser General Public License, applies to some specially designated software packages--typically libraries--of the Free Software Foundation and other authors who decide to use it. You can use it too, but we suggest you first think carefully about whether this license or the ordinary General Public License is the better strategy to use in any particular case, based on the explanations below. When we speak of free software, we are referring to freedom of use, not price. Our General Public Licenses are designed to make sure that you have the freedom to distribute copies of free software (and charge for this service if you wish); that you receive source code or can get it if you want it; that you can change the software and use pieces of it in new free programs; and that you are informed that you can do these things. To protect your rights, we need to make restrictions that forbid distributors to deny you these rights or to ask you to surrender these rights. These restrictions translate to certain responsibilities for you if you distribute copies of the library or if you modify it. For example, if you distribute copies of the library, whether gratis or for a fee, you must give the recipients all the rights that we gave you. You must make sure that they, too, receive or can get the source code. If you link other code with the library, you must provide complete object files to the recipients, so that they can relink them with the library after making changes to the library and recompiling it. And you must show them these terms so they know their rights. We protect your rights with a two-step method: (1) we copyright the library, and (2) we offer you this license, which gives you legal permission to copy, distribute and/or modify the library. To protect each distributor, we want to make it very clear that there is no warranty for the free library. 
Also, if the library is modified by someone else and passed on, the recipients should know that what they have is not the original version, so that the original author's reputation will not be affected by problems that might be introduced by others. Finally, software patents pose a constant threat to the existence of any free program. We wish to make sure that a company cannot effectively restrict the users of a free program by obtaining a restrictive license from a patent holder. Therefore, we insist that any patent license obtained for a version of the library must be consistent with the full freedom of use specified in this license. Most GNU software, including some libraries, is covered by the ordinary GNU General Public License. This license, the GNU Lesser General Public License, applies to certain designated libraries, and is quite different from the ordinary General Public License. We use this license for certain libraries in order to permit linking those libraries into non-free programs. When a program is linked with a library, whether statically or using a shared library, the combination of the two is legally speaking a combined work, a derivative of the original library. The ordinary General Public License therefore permits such linking only if the entire combination fits its criteria of freedom. The Lesser General Public License permits more lax criteria for linking other code with the library. We call this license the "Lesser" General Public License because it does Less to protect the user's freedom than the ordinary General Public License. It also provides other free software developers Less of an advantage over competing non-free programs. These disadvantages are the reason we use the ordinary General Public License for many libraries. However, the Lesser license provides advantages in certain special circumstances. For example, on rare occasions, there may be a special need to encourage the widest possible use of a certain library, so that it becomes a de-facto standard. To achieve this, non-free programs must be allowed to use the library. A more frequent case is that a free library does the same job as widely used non-free libraries. In this case, there is little to gain by limiting the free library to free software only, so we use the Lesser General Public License. In other cases, permission to use a particular library in non-free programs enables a greater number of people to use a large body of free software. For example, permission to use the GNU C Library in non-free programs enables many more people to use the whole GNU operating system, as well as its variant, the GNU/Linux operating system. Although the Lesser General Public License is Less protective of the users' freedom, it does ensure that the user of a program that is linked with the Library has the freedom and the wherewithal to run that program using a modified version of the Library. The precise terms and conditions for copying, distribution and modification follow. Pay close attention to the difference between a "work based on the library" and a "work that uses the library". The former contains code derived from the library, whereas the latter must be combined with the library in order to run. GNU LESSER GENERAL PUBLIC LICENSE TERMS AND CONDITIONS FOR COPYING, DISTRIBUTION AND MODIFICATION 0. 
This License Agreement applies to any software library or other program which contains a notice placed by the copyright holder or other authorized party saying it may be distributed under the terms of this Lesser General Public License (also called "this License"). Each licensee is addressed as "you". A "library" means a collection of software functions and/or data prepared so as to be conveniently linked with application programs (which use some of those functions and data) to form executables. The "Library", below, refers to any such software library or work which has been distributed under these terms. A "work based on the Library" means either the Library or any derivative work under copyright law: that is to say, a work containing the Library or a portion of it, either verbatim or with modifications and/or translated straightforwardly into another language. (Hereinafter, translation is included without limitation in the term "modification".) "Source code" for a work means the preferred form of the work for making modifications to it. For a library, complete source code means all the source code for all modules it contains, plus any associated interface definition files, plus the scripts used to control compilation and installation of the library. Activities other than copying, distribution and modification are not covered by this License; they are outside its scope. The act of running a program using the Library is not restricted, and output from such a program is covered only if its contents constitute a work based on the Library (independent of the use of the Library in a tool for writing it). Whether that is true depends on what the Library does and what the program that uses the Library does. 1. You may copy and distribute verbatim copies of the Library's complete source code as you receive it, in any medium, provided that you conspicuously and appropriately publish on each copy an appropriate copyright notice and disclaimer of warranty; keep intact all the notices that refer to this License and to the absence of any warranty; and distribute a copy of this License along with the Library. You may charge a fee for the physical act of transferring a copy, and you may at your option offer warranty protection in exchange for a fee. 2. You may modify your copy or copies of the Library or any portion of it, thus forming a work based on the Library, and copy and distribute such modifications or work under the terms of Section 1 above, provided that you also meet all of these conditions: a) The modified work must itself be a software library. b) You must cause the files modified to carry prominent notices stating that you changed the files and the date of any change. c) You must cause the whole of the work to be licensed at no charge to all third parties under the terms of this License. d) If a facility in the modified Library refers to a function or a table of data to be supplied by an application program that uses the facility, other than as an argument passed when the facility is invoked, then you must make a good faith effort to ensure that, in the event an application does not supply such function or table, the facility still operates, and performs whatever part of its purpose remains meaningful. (For example, a function in a library to compute square roots has a purpose that is entirely well-defined independent of the application. 
Therefore, Subsection 2d requires that any application-supplied function or table used by this function must be optional: if the application does not supply it, the square root function must still compute square roots.) These requirements apply to the modified work as a whole. If identifiable sections of that work are not derived from the Library, and can be reasonably considered independent and separate works in themselves, then this License, and its terms, do not apply to those sections when you distribute them as separate works. But when you distribute the same sections as part of a whole which is a work based on the Library, the distribution of the whole must be on the terms of this License, whose permissions for other licensees extend to the entire whole, and thus to each and every part regardless of who wrote it. Thus, it is not the intent of this section to claim rights or contest your rights to work written entirely by you; rather, the intent is to exercise the right to control the distribution of derivative or collective works based on the Library. In addition, mere aggregation of another work not based on the Library with the Library (or with a work based on the Library) on a volume of a storage or distribution medium does not bring the other work under the scope of this License. 3. You may opt to apply the terms of the ordinary GNU General Public License instead of this License to a given copy of the Library. To do this, you must alter all the notices that refer to this License, so that they refer to the ordinary GNU General Public License, version 2, instead of to this License. (If a newer version than version 2 of the ordinary GNU General Public License has appeared, then you can specify that version instead if you wish.) Do not make any other change in these notices. Once this change is made in a given copy, it is irreversible for that copy, so the ordinary GNU General Public License applies to all subsequent copies and derivative works made from that copy. This option is useful when you wish to copy part of the code of the Library into a program that is not a library. 4. You may copy and distribute the Library (or a portion or derivative of it, under Section 2) in object code or executable form under the terms of Sections 1 and 2 above provided that you accompany it with the complete corresponding machine-readable source code, which must be distributed under the terms of Sections 1 and 2 above on a medium customarily used for software interchange. If distribution of object code is made by offering access to copy from a designated place, then offering equivalent access to copy the source code from the same place satisfies the requirement to distribute the source code, even though third parties are not compelled to copy the source along with the object code. 5. A program that contains no derivative of any portion of the Library, but is designed to work with the Library by being compiled or linked with it, is called a "work that uses the Library". Such a work, in isolation, is not a derivative work of the Library, and therefore falls outside the scope of this License. However, linking a "work that uses the Library" with the Library creates an executable that is a derivative of the Library (because it contains portions of the Library), rather than a "work that uses the library". The executable is therefore covered by this License. Section 6 states terms for distribution of such executables. 
When a "work that uses the Library" uses material from a header file that is part of the Library, the object code for the work may be a derivative work of the Library even though the source code is not. Whether this is true is especially significant if the work can be linked without the Library, or if the work is itself a library. The threshold for this to be true is not precisely defined by law. If such an object file uses only numerical parameters, data structure layouts and accessors, and small macros and small inline functions (ten lines or less in length), then the use of the object file is unrestricted, regardless of whether it is legally a derivative work. (Executables containing this object code plus portions of the Library will still fall under Section 6.) Otherwise, if the work is a derivative of the Library, you may distribute the object code for the work under the terms of Section 6. Any executables containing that work also fall under Section 6, whether or not they are linked directly with the Library itself. 6. As an exception to the Sections above, you may also combine or link a "work that uses the Library" with the Library to produce a work containing portions of the Library, and distribute that work under terms of your choice, provided that the terms permit modification of the work for the customer's own use and reverse engineering for debugging such modifications. You must give prominent notice with each copy of the work that the Library is used in it and that the Library and its use are covered by this License. You must supply a copy of this License. If the work during execution displays copyright notices, you must include the copyright notice for the Library among them, as well as a reference directing the user to the copy of this License. Also, you must do one of these things: a) Accompany the work with the complete corresponding machine-readable source code for the Library including whatever changes were used in the work (which must be distributed under Sections 1 and 2 above); and, if the work is an executable linked with the Library, with the complete machine-readable "work that uses the Library", as object code and/or source code, so that the user can modify the Library and then relink to produce a modified executable containing the modified Library. (It is understood that the user who changes the contents of definitions files in the Library will not necessarily be able to recompile the application to use the modified definitions.) b) Use a suitable shared library mechanism for linking with the Library. A suitable mechanism is one that (1) uses at run time a copy of the library already present on the user's computer system, rather than copying library functions into the executable, and (2) will operate properly with a modified version of the library, if the user installs one, as long as the modified version is interface-compatible with the version that the work was made with. c) Accompany the work with a written offer, valid for at least three years, to give the same user the materials specified in Subsection 6a, above, for a charge no more than the cost of performing this distribution. d) If distribution of the work is made by offering access to copy from a designated place, offer equivalent access to copy the above specified materials from the same place. e) Verify that the user has already received a copy of these materials or that you have already sent this user a copy. 
For an executable, the required form of the "work that uses the Library" must include any data and utility programs needed for reproducing the executable from it. However, as a special exception, the materials to be distributed need not include anything that is normally distributed (in either source or binary form) with the major components (compiler, kernel, and so on) of the operating system on which the executable runs, unless that component itself accompanies the executable. It may happen that this requirement contradicts the license restrictions of other proprietary libraries that do not normally accompany the operating system. Such a contradiction means you cannot use both them and the Library together in an executable that you distribute. 7. You may place library facilities that are a work based on the Library side-by-side in a single library together with other library facilities not covered by this License, and distribute such a combined library, provided that the separate distribution of the work based on the Library and of the other library facilities is otherwise permitted, and provided that you do these two things: a) Accompany the combined library with a copy of the same work based on the Library, uncombined with any other library facilities. This must be distributed under the terms of the Sections above. b) Give prominent notice with the combined library of the fact that part of it is a work based on the Library, and explaining where to find the accompanying uncombined form of the same work. 8. You may not copy, modify, sublicense, link with, or distribute the Library except as expressly provided under this License. Any attempt otherwise to copy, modify, sublicense, link with, or distribute the Library is void, and will automatically terminate your rights under this License. However, parties who have received copies, or rights, from you under this License will not have their licenses terminated so long as such parties remain in full compliance. 9. You are not required to accept this License, since you have not signed it. However, nothing else grants you permission to modify or distribute the Library or its derivative works. These actions are prohibited by law if you do not accept this License. Therefore, by modifying or distributing the Library (or any work based on the Library), you indicate your acceptance of this License to do so, and all its terms and conditions for copying, distributing or modifying the Library or works based on it. 10. Each time you redistribute the Library (or any work based on the Library), the recipient automatically receives a license from the original licensor to copy, distribute, link with or modify the Library subject to these terms and conditions. You may not impose any further restrictions on the recipients' exercise of the rights granted herein. You are not responsible for enforcing compliance by third parties with this License. 11. If, as a consequence of a court judgment or allegation of patent infringement or for any other reason (not limited to patent issues), conditions are imposed on you (whether by court order, agreement or otherwise) that contradict the conditions of this License, they do not excuse you from the conditions of this License. If you cannot distribute so as to satisfy simultaneously your obligations under this License and any other pertinent obligations, then as a consequence you may not distribute the Library at all. 
For example, if a patent license would not permit royalty-free redistribution of the Library by all those who receive copies directly or indirectly through you, then the only way you could satisfy both it and this License would be to refrain entirely from distribution of the Library. If any portion of this section is held invalid or unenforceable under any particular circumstance, the balance of the section is intended to apply, and the section as a whole is intended to apply in other circumstances. It is not the purpose of this section to induce you to infringe any patents or other property right claims or to contest validity of any such claims; this section has the sole purpose of protecting the integrity of the free software distribution system which is implemented by public license practices. Many people have made generous contributions to the wide range of software distributed through that system in reliance on consistent application of that system; it is up to the author/donor to decide if he or she is willing to distribute software through any other system and a licensee cannot impose that choice. This section is intended to make thoroughly clear what is believed to be a consequence of the rest of this License. 12. If the distribution and/or use of the Library is restricted in certain countries either by patents or by copyrighted interfaces, the original copyright holder who places the Library under this License may add an explicit geographical distribution limitation excluding those countries, so that distribution is permitted only in or among countries not thus excluded. In such case, this License incorporates the limitation as if written in the body of this License. 13. The Free Software Foundation may publish revised and/or new versions of the Lesser General Public License from time to time. Such new versions will be similar in spirit to the present version, but may differ in detail to address new problems or concerns. Each version is given a distinguishing version number. If the Library specifies a version number of this License which applies to it and "any later version", you have the option of following the terms and conditions either of that version or of any later version published by the Free Software Foundation. If the Library does not specify a license version number, you may choose any version ever published by the Free Software Foundation. 14. If you wish to incorporate parts of the Library into other free programs whose distribution conditions are incompatible with these, write to the author to ask for permission. For software which is copyrighted by the Free Software Foundation, write to the Free Software Foundation; we sometimes make exceptions for this. Our decision will be guided by the two goals of preserving the free status of all derivatives of our free software and of promoting the sharing and reuse of software generally. NO WARRANTY 15. BECAUSE THE LIBRARY IS LICENSED FREE OF CHARGE, THERE IS NO WARRANTY FOR THE LIBRARY, TO THE EXTENT PERMITTED BY APPLICABLE LAW. EXCEPT WHEN OTHERWISE STATED IN WRITING THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES PROVIDE THE LIBRARY "AS IS" WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE. THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE OF THE LIBRARY IS WITH YOU. SHOULD THE LIBRARY PROVE DEFECTIVE, YOU ASSUME THE COST OF ALL NECESSARY SERVICING, REPAIR OR CORRECTION. 16. 
IN NO EVENT UNLESS REQUIRED BY APPLICABLE LAW OR AGREED TO IN WRITING WILL ANY COPYRIGHT HOLDER, OR ANY OTHER PARTY WHO MAY MODIFY AND/OR REDISTRIBUTE THE LIBRARY AS PERMITTED ABOVE, BE LIABLE TO YOU FOR DAMAGES, INCLUDING ANY GENERAL, SPECIAL, INCIDENTAL OR CONSEQUENTIAL DAMAGES ARISING OUT OF THE USE OR INABILITY TO USE THE LIBRARY (INCLUDING BUT NOT LIMITED TO LOSS OF DATA OR DATA BEING RENDERED INACCURATE OR LOSSES SUSTAINED BY YOU OR THIRD PARTIES OR A FAILURE OF THE LIBRARY TO OPERATE WITH ANY OTHER SOFTWARE), EVEN IF SUCH HOLDER OR OTHER PARTY HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH DAMAGES. END OF TERMS AND CONDITIONS How to Apply These Terms to Your New Libraries If you develop a new library, and you want it to be of the greatest possible use to the public, we recommend making it free software that everyone can redistribute and change. You can do so by permitting redistribution under these terms (or, alternatively, under the terms of the ordinary General Public License). To apply these terms, attach the following notices to the library. It is safest to attach them to the start of each source file to most effectively convey the exclusion of warranty; and each file should have at least the "copyright" line and a pointer to where the full notice is found. Copyright (C) This library is free software; you can redistribute it and/or modify it under the terms of the GNU Lesser General Public License as published by the Free Software Foundation; either version 2.1 of the License, or (at your option) any later version. This library is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for more details. You should have received a copy of the GNU Lesser General Public License along with this library; if not, write to the Free Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA Also add information on how to contact you by electronic and paper mail. You should also get your employer (if you work as a programmer) or your school, if any, to sign a "copyright disclaimer" for the library, if necessary. Here is a sample; alter the names: Yoyodyne, Inc., hereby disclaims all copyright interest in the library `Frob' (a library for tweaking knobs) written by James Random Hacker. , 1 April 1990 Ty Coon, President of Vice That's all there is to it! ================================================ FILE: lib/LIBNOTES ================================================ This file briefly describes the libraries which are used by the OpenNLP CCG Library. See the appropriate license files also in this directory. ------------------------------------------------------------------------ ant.jar, ant-launcher.jar, ant-junit.jar, ant-junit4.jar, ant-contrib.jar The Apache Ant Build System, version 1.9.0 Homepage: http://ant.apache.org/ ANT Contrib, version 1.0b3 Homepage: http://sourceforge.net/projects/ant-contrib/ License: Apache Software License (ASL) A Java based build tool. ------------------------------------------------------------------------ jdom.jar JDOM, version 1.1 Homepage: http://www.jdom.org License: See jdom.license A complete, Java-based solution for accessing, manipulating, and outputting XML data from Java code. 
------------------------------------------------------------------------ jgrapht-jdk1.6.jar JGraphT, version 0.8.3 Homepage: http://www.jgrapht.org License: LGPL A free Java graph library that provides mathematical graph-theory objects and algorithms. ------------------------------------------------------------------------ jline.jar jLine, version 1.0 Homepage: http://jline.sourceforge.net/ License: See jline.license JLine is a Java library for handling console input. It is similar in functionality to BSD editline and GNU readline, providing a command input history and more. ------------------------------------------------------------------------ junit-4.10.jar JUnit, version 4.10 Homepage: http://junit.sourceforge.net/ License: Common Public License - v 1.0 JUnit is a simple, open source framework to write and run repeatable tests. ------------------------------------------------------------------------ libken.so KenLM, version 4 Homepage: http://kheafield.com/code/kenlm/ License: LGPL primarily (see src/kenlm/LICENSE) KenLM is a language modeling toolkit supporting large LMs via a memory-mapped binary format. JNI interface for linux adapted from the Joshua decoder; other platforms possible in principle. ------------------------------------------------------------------------ trove.jar GNU Trove, version 1.0.2 Homepage: http://trove4j.sf.net License: LGPL High performance collections for Java. ------------------------------------------------------------------------ xalan.jar, xercesImpl.jar, xml-apis.jar, xlstc.jar, serializer.jar The Apache Xalan-J XML transformation processor, version 2.7.1 The Apache Xerces-J XML parser, version 2.9.0 Homepage: http://xml.apache.org License: Apache Software License (ASL) XSLT transformation library and associated XML parser, with schema validation support. ------------------------------------------------------------------------ jopt-simple.jar JOpt Simple, version 3.1 Homepage: http://jopt-simple.sourceforge.net/ License: MIT License Command-line options parsing library. ------------------------------------------------------------------------ javacc.jar JavaCC, version 4.0 Homepage: https://javacc.dev.java.net/ License: SUN License Java parser generator. ================================================ FILE: lib/MIT ================================================ The MIT License Copyright (c) Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software. THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. ================================================ FILE: lib/SUN ================================================ Copyright (c) 2003 Sun Microsystems, Inc. 
All Rights Reserved. Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: -Redistribution of source code must retain the above copyright notice, this list of conditions and the following disclaimer. -Redistribution in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution. Neither the name of Sun Microsystems, Inc. or the names of contributors may be used to endorse or promote products derived from this software without specific prior written permission. This software is provided "AS IS," without a warranty of any kind. ALL EXPRESS OR IMPLIED CONDITIONS, REPRESENTATIONS AND WARRANTIES, INCLUDING ANY IMPLIED WARRANTY OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE OR NON-INFRINGEMENT, ARE HEREBY EXCLUDED. SUN MIDROSYSTEMS, INC. ("SUN") AND ITS LICENSORS SHALL NOT BE LIABLE FOR ANY DAMAGES SUFFERED BY LICENSEE AS A RESULT OF USING, MODIFYING OR DISTRIBUTING THIS SOFTWARE OR ITS DERIVATIVES. IN NO EVENT WILL SUN OR ITS LICENSORS BE LIABLE FOR ANY LOST REVENUE, PROFIT OR DATA, OR FOR DIRECT, INDIRECT, SPECIAL, CONSEQUENTIAL, INCIDENTAL OR PUNITIVE DAMAGES, HOWEVER CAUSED AND REGARDLESS OF THE THEORY OF LIABILITY, ARISING OUT OF THE USE OF OR INABILITY TO USE THIS SOFTWARE, EVEN IF SUN HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH DAMAGES. You acknowledge that this software is not designed, licensed or intended for use in the design, construction, operation or maintenance of any nuclear facility. ================================================ FILE: lib/jdom.license ================================================ /*-- $Id: jdom.license,v 1.1.1.1 2003/02/28 18:02:10 mwhite14850 Exp $ Copyright (C) 2001 Brett McLaughlin & Jason Hunter. All rights reserved. Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: 1. Redistributions of source code must retain the above copyright notice, this list of conditions, and the following disclaimer. 2. Redistributions in binary form must reproduce the above copyright notice, this list of conditions, and the disclaimer that follows these conditions in the documentation and/or other materials provided with the distribution. 3. The name "JDOM" must not be used to endorse or promote products derived from this software without prior written permission. For written permission, please contact license@jdom.org. 4. Products derived from this software may not be called "JDOM", nor may "JDOM" appear in their name, without prior written permission from the JDOM Project Management (pm@jdom.org). In addition, we request (but do not require) that you include in the end-user documentation provided with the redistribution and/or in the software itself an acknowledgement equivalent to the following: "This product includes software developed by the JDOM Project (http://www.jdom.org/)." Alternatively, the acknowledgment may be graphical using the logos available at http://www.jdom.org/images/logos. THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 
IN NO EVENT SHALL THE JDOM AUTHORS OR THE PROJECT CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. This software consists of voluntary contributions made by many individuals on behalf of the JDOM Project and was originally created by Brett McLaughlin and Jason Hunter . For more information on the JDOM Project, please see . */ ================================================ FILE: lib/jline.license ================================================ Copyright (c) 2002-2006, Marc Prud'hommeaux All rights reserved. Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer. Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution. Neither the name of JLine nor the names of its contributors may be used to endorse or promote products derived from this software without specific prior written permission. THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. ================================================ FILE: pom.xml ================================================ 4.0.0 opennlp ccg 0.10.0 pom src/ 1.8 1.8 ================================================ FILE: src/ccg2xml/README ================================================ README for ccg2xml Ben Wing October 8, 2006 ccg2xml is a front-end for more conveniently specifying OpenCCG grammars. The native XML format is not human-friendly and contains much repetition of information, often involving long-distance dependencies, which are difficult to keep track of. The .ccg format that is accepted by ccg2xml is designed to be expressive, concise and human-friendly, with as little required duplication as possible. 
ccg2xml is run on a .ccg file and produces (by default) the following files in the current directory:

- lexicon.xml: Categories, lexical insertion rules
- morph.xml: Morphological forms of words, feature macros
- types.xml: Feature type hierarchies
- rules.xml: Allowable combinatory, type-raising and type-changing rules
- grammar.xml: File giving the names and locations of the previous four files
- testbed.xml: File containing test sentences and expected number of parses

The standard OpenCCG tools, such as tccg, can then be run as if the grammar had been developed directly in XML. ccg2xml will output error messages if it encounters syntax errors, and in such a case will not generate any XML files. (It may also generate warnings, which are non-fatal in that they do not prevent generation.)

ccg2xml has a few options:

-o controls which XML files are generated; this can be useful for using ccg2xml in conjunction with an existing grammar.
-t outputs the file to stdout after all macro substitutions have been applied; this can help in debugging complicated macros that aren't working as expected.
-d controls which directory the XML files are output to (by default, the current directory).
-y, -m, and --super-macro-debug are debug options useful mostly for developers of ccg2xml.

For more information, run `ccg2xml -h' to get the "usage" message.

ccg2xml is written in Python, and is itself a piece of generated code. It makes use of PLY, a Python system for developing unambiguous context-free grammar parsers, similar to lex and yacc. PLY is written by David Beazley (dave@dabeaz.com) and is available at http://www.dabeaz.com/ply/; PLY 1.6 is included as part of the ccg2xml source (the files lex.py and yacc.py). PLY uses a clever trick of introspecting on the source file to determine the rules, which are stored in documentation strings. However, this ends up requiring a certain amount of redundancy in the source file. This gets awkward for large projects, so I created a front-end format that closely emulates yacc's format, while adding support for regular-expression operators on the right-hand side (RHS) of a rule (*, +, and ?); it consists of mixed CFG specifications and Python code. The file `convert-ply.py' converts from my local .ply format into standard .py files, and is used (see `Makefile') to generate the ccg2xml script. (It also attempts to work around a serious bug in PLY; see the note below.) The source file ccg.ply is currently 1,727 lines in length (of mixed CFG specifications and Python code), and the auto-generated ccg2xml file is 2,370 lines.

NOTE: ccg2xml was written using PLY 1.6, which is included as part of ccg2xml (lex.py and yacc.py). PLY 1.6 contains a serious bug involving empty RHS productions, which convert-ply.py attempts to work around and which ccg.ply also works around. I was never able to figure out the exact rule format that triggers this bug, so I simply had to use trial and error in rewriting rules to get a working ccg2xml. It is strongly recommended to upgrade to the most recent version of PLY (currently 2.1), which is likely to fix this problem and make it possible to deterministically modify ccg.ply.

--------------------------------------------------
The .ccg format
--------------------------------------------------

The general feel of the syntax is like C, Java or Perl.
Indentation and whitespace are unimportant. (The only exception is in macro definitions, where the text of a macro must either be on the same line as the definition -- possibly extended with backslash line-continuation markers -- or be enclosed in braces.) This is critical for macros, where having to worry about precisely controlling the indentation or whitespace at the beginning or end of a macro definition (such as would be required in Python or shell scripts) would be a major hassle and impediment.

The file consists of a number of declarations, which specify features (feature {}), word stems and inflected forms (word {}), lexical insertion rules (family {}), test sentences (testbed {}), and other information relevant to the grammar. It can also contain macro definitions (def {}) along with corresponding macro calls, such as the calls to noun() and verb() in the sample grammar above. The macro mechanism is essentially just a way of doing parameterized text substitution, and is discussed in detail in sections 2.4 and 3.2.

In general, declarations can be in any order; any dependencies that must be computed are resolved after the entire file has been parsed. Furthermore, any declaration containing multiple parts (for example, a feature declaration encompassing multiple features, a word declaration with multiple inflections, or a family declaration with multiple insertion rules) can be split up into separate declarations.

In addition, the syntax tries to be very forgiving about commas, semicolons, and other terminators and separators. (In most lists, in fact, commas are optional, duplicated commas are no problem, and extra commas at the end of a list are allowed. The main exception where commas matter is in macro calls. You can still put an extra comma at the end of a macro call, but otherwise you must have exactly one comma (no more, no less) between arguments. The reason is that macro arguments can contain pretty much any text whatsoever (including no text at all), so commas are needed to indicate where one argument stops and the next one starts.) This simplifies, in a number of ways, the creation of lists using macros.

The exceptions to these syntactic allowances are all related to macros. For example, macros must be defined before they can be used. (That is, before they are used in a macro call in the main text of the grammar; this does not apply to macro calls inside of another macro definition.) Also, the syntax of commas in argument lists of macro calls is much stricter than in lists occurring elsewhere in the grammar (see above).

Note that, in general, there is no need to put quotes around literal text, such as the inflected forms of words. There is also no concept of "reserved words" in this format. Words like feature, word, and entry that have a special significance as "declarators" when in the right place in the syntax can otherwise be freely used as word stems and inflections, macro variable names, part-of-speech tags, etc. At the same time, however, it is possible to put quotes (single or double) around text. This allows special characters, spaces, etc. to be used in word inflections, feature values, and the like; otherwise, only letters, numbers, '_', '-', '+', '%' and non-ASCII characters can be used. Quotes can also be used to protect against the accidental interpretation of a word as a declarator, in the rare case that this is needed.
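As a concrete illustration of the points above, here is a minimal Python sketch of parameterized text substitution in which macro-call arguments are split only at top-level commas, with nested parens, brackets and braces kept intact (as described in the Macros section below). It is purely illustrative and is not the ccg2xml implementation; the helper names (split_args, substitute, expand) and the noun() macro body are made up for the example.

# Illustrative sketch only (not ccg2xml's actual code): parameterized text
# substitution with macro-call arguments split at top-level commas,
# respecting nested (), [] and {} as described in the Macros section below.
import re

OPEN, CLOSE = "([{", ")]}"

def split_args(text):
    """Split a macro-call argument string at commas that are not nested
    inside parens, brackets, or braces."""
    args, depth, current = [], 0, []
    for ch in text:
        if ch in OPEN:
            depth += 1
        elif ch in CLOSE:
            depth -= 1
        if ch == "," and depth == 0:
            args.append("".join(current).strip())
            current = []
        else:
            current.append(ch)
    args.append("".join(current).strip())
    return args

def substitute(body, params, args):
    """Replace whole-token occurrences of each formal parameter in the
    macro body with the corresponding argument text."""
    mapping = dict(zip(params, args))
    tokens = re.split(r"(\W)", body)          # keep punctuation as separate tokens
    return "".join(mapping.get(tok, tok) for tok in tokens)

def expand(call, macros):
    """Expand one macro call such as 'noun(book, sg)'; a real expander
    would re-scan the result and expand any nested macro calls too."""
    m = re.match(r"([\w-]+)\((.*)\)\s*$", call.strip())
    name, argtext = m.group(1), m.group(2)
    params, body = macros[name]
    return substitute(body, params, split_args(argtext))

# Hypothetical macro table: def noun(stem, num) { word stem: noun<num>; }
macros = {"noun": (["stem", "num"], "word stem: noun<num>;")}

print(split_args("a, bar(b, c)"))         # ['a', 'bar(b, c)'] -- two args, not three
print(expand("noun(book, sg)", macros))   # word book: noun<sg>;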
The overall syntactic laxity of the language is part of a general philosophy of making the grammar language as tolerant and as expressive as possible. This is in keeping with the purpose of the language. Although it looks similar to a traditional programming language, its semantics is on a much higher level, where expressiveness is much more important and precision relatively less important. Furthermore, the language is intended for use by non-programmers as well as programmers, and non-programmers are likely to have difficulty with rigid syntax rules, especially in the presence of macros.

--------------------------------------------------
Macros
--------------------------------------------------

The mechanism I chose to eliminate repetition is parameterized macros, which work like macro functions in C. Their definition includes a series of formal parameters and a section of literal text intermixed with the names of the macro's parameters. When a call to the macro occurs, the macro's text replaces the call, with the actual arguments to the call substituted for the occurrences of the corresponding formal parameters in the text. Any macro calls occurring in this text are then recursively expanded.

The macro expansion mechanism generally happens at the level of tokens, where a token is a single word, a single non-alphanumeric character, or a single piece of quoted text. However, it is possible to construct a token by pasting two tokens together, using the dot operator; this is similar to the ## operator in C. This is useful for constructing inflected forms of words, as shown in the tiny.ccg and arabic.ccg sample files. It is also possible to compositionally construct the name of a macro and then call this constructed name; this is used in arabic.ccg, in the macro 3rd-weak-verb().

The parser pays attention to matched pairs of parens, brackets, and braces in the text of a macro call argument, and will not get confused by commas inside such matched delimiters. Thus, a macro call foo(a, bar(b, c)) is correctly interpreted as a call to foo() with two arguments, a and bar(b, c), and not as a call to foo() with three arguments, where the first argument is a, the second argument is bar(b, and the third argument is c).

The text of both macro definitions and arguments to macro calls can optionally be surrounded by braces, to clearly delimit the text boundaries. The braces do not form part of the text itself (to specify text surrounded by braces, a second set would have to be added around the text). It is conventional to surround macro definitions with braces, except sometimes for very short definitions that fit on one line. However, braces are not normally used around macro call arguments unless necessary for correct parsing (for example, a macro argument containing a comma that is not surrounded by matching delimiters).

--------------------------------
Sample Files
--------------------------------

Three sample .ccg-format files are currently included in the directory `ccg-format-grammars' off of the top-level OpenCCG directory:

- `tinytiny.ccg' is a simple file that parses a basic chunk of English (including nouns, personal pronouns, articles, and transitive and intransitive verbs) and demonstrates the basic features of the .ccg format.

- `tiny.ccg' is a conversion of the original OpenCCG "tiny" sample grammar to .ccg format.
`tiny.ccg' is no longer as small as its name implies, especially since it contains a large number of comments describing the CCG format in depth, as well as a number of example declarations to demonstrate the various features of the CCG format. - `arabic.ccg' is an Arabic grammar fragment, which demonstrates how to effectively use macros in order to efficiently generate the morphology of a complex, highly-inflected language. ================================================ FILE: src/ccg2xml/Tree.py ================================================ # Highly optimized Tkinter tree control # by Charles E. "Gene" Cash # # This is documented more fully on my homepage at # http://home.cfl.rr.com/genecash/ and if it's not there, look in the Vaults # of Parnassus at http://www.vex.net/parnassus/ which I promise to keep # updated. # # Thanks to Laurent Claustre for sending lots of helpful # bug reports. # # This copyright license is intended to be similar to the FreeBSD license. # # Copyright 1998 Gene Cash All rights reserved. # # Redistribution and use in source and binary forms, with or without # modification, are permitted provided that the following conditions are # met: # # 1. Redistributions of source code must retain the above copyright # notice, this list of conditions and the following disclaimer. # 2. Redistributions in binary form must reproduce the above copyright # notice, this list of conditions and the following disclaimer in the # documentation and/or other materials provided with the # distribution. # # THIS SOFTWARE IS PROVIDED BY GENE CASH ``AS IS'' AND ANY EXPRESS OR # IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES # OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE # DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR # ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL # DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS # OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) # HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, # STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN # ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE # POSSIBILITY OF SUCH DAMAGE. # # This means you may do anything you want with this code, except claim you # wrote it. Also, if it breaks you get to keep both pieces. # # 02-DEC-98 Started writing code. # 22-NOV-99 Changed garbage collection to a better algorithm. # 28-AUG-01 Added logic to deal with exceptions in user callbacks. # 02-SEP-01 Fixed hang when closing last node. # 07-SEP-01 Added binding tracking so nodes got garbage-collected. # Also fixed subclass call to initialize Canvas to properly deal # with variable arguments and keyword arguments. # 11-SEP-01 Bugfix for unbinding code. # 13-OCT-01 Added delete & insert methods for nodes (by email request). # LOTS of code cleanup. # Changed leading double underscores to PVT nomenclature. # Added ability to pass Node subclass to Tree constructor. # Removed after_callback since subclassing Node is better idea. # 15-OCT-01 Finally added drag'n'drop support. It consisted of a simple # change to the Node PVT_click method, and addition of logic like # the example in Tkdnd.py. It took 3 days to grok the Tkdnd # example and 2 hours to make the code changes. Plus another 1/2 # day to get a working where() function. # 16-OCT-01 Incorporated fixes to delete() and dnd_commit() bugs by # Laurent Claustre . 
# 17-OCT-01 Added find_full_id() and cursor_node() methods. # 18-OCT-01 Fixes to delete() on root during collapse and with # drag-in-progress flag by Laurent Claustre . # 10-FEB-02 Fix to prev_visible() by Nicolas Pascal . # Fixes which made insert_before()/insert_after() actually work. # Also added expand/collapse indicators like Internet Explorer # as requested by Nicolas. # 11-FEB-02 Another fix to prev_visible(). It works this time. Honest. # 31-MAY-02 Added documentation strings so the new PYthon 2.2 help function # is a little more useful. # 19-AUG-02 Minor fix to eliminate crash in "treedemo-icons.py" caused by # referencing expand/collapse indicators when lines are turned off. # 15-OCT-02 Used new idiom for calling Canvas superclass. # 18-NOV-02 Fixed bug discovered by Amanjit Gill , where # I didn't pass "master" properly to the Canvas superclass. Sigh. # One step forward, one step back. import Tkdnd from Tkinter import * #------------------------------------------------------------------------------ def report_callback_exception(): """report exception on sys.stderr.""" import traceback import sys sys.stderr.write("Exception in Tree control callback\n") traceback.print_exc() #------------------------------------------------------------------------------ class Struct: """Helper object for add_node() method""" def __init__(self): pass #------------------------------------------------------------------------------ class Node: """Tree helper class that's instantiated for each element in the tree. It has several useful attributes: parent_node - immediate parent node id - id assigned at creation expanded_icon - image displayed when folder is expanded to display children collapsed_icon - image displayed when node is not a folder or folder is collapsed. parent_widget - reference to tree widget that contains node. expandable_flag - is true when node is a folder that may be expanded or collapsed. expanded_flag - true to indicate node is currently expanded. h_line - canvas line to left of node image. v_line - canvas line below node image that connects children. indic - expand/collapse canvas image. label - canvas text label symbol - current canvas image Please note that methods prefixed PVT_* are not meant to be used by client programs.""" def __init__(self, parent_node, id, collapsed_icon, x, y, parent_widget=None, expanded_icon=None, label=None, expandable_flag=0): """Create node and initialize it. 
This also displays the node at the given position on the canvas, and binds mouseclicks.""" # immediate parent node self.parent_node=parent_node # internal name used to manipulate things self.id=id # bitmaps to be displayed self.expanded_icon=expanded_icon self.collapsed_icon=collapsed_icon # tree widget we belong to if parent_widget: self.widget=parent_widget else: self.widget=parent_node.widget # for speed sw=self.widget # our list of child nodes self.child_nodes=[] # flag that node can be expanded self.expandable_flag=expandable_flag self.expanded_flag=0 # add line if parent_node and sw.line_flag: self.h_line=sw.create_line(x, y, x-sw.dist_x, y) else: self.h_line=None self.v_line=None # draw approprate image self.symbol=sw.create_image(x, y, image=self.collapsed_icon) # add expand/collapse indicator self.indic=None if expandable_flag and sw.line_flag and sw.plus_icon and sw.minus_icon: self.indic=sw.create_image(x-sw.dist_x, y, image=sw.plus_icon) # add label self.label=sw.create_text(x+sw.text_offset, y, text=label, anchor='w') # single-click to expand/collapse if self.indic: sw.tag_bind(self.indic, '<1>', self.PVT_click) else: sw.tag_bind(self.symbol, '<1>', self.PVT_click) # for drag'n'drop target detection sw.tag_bind(self.symbol, '', self.PVT_enter) sw.tag_bind(self.label, '', self.PVT_enter) # for testing (gotta make sure nodes get properly GC'ed) #def __del__(self): # print self.full_id(), 'deleted' # ----- PUBLIC METHODS ----- def set_collapsed_icon(self, icon): """Set node's collapsed image""" self.collapsed_icon=icon if not self.expanded_flag: self.widget.itemconfig(self.symbol, image=icon) def set_expanded_icon(self, icon): """Set node's expanded image""" self.expanded_icon=icon if self.expanded_flag: self.widget.itemconfig(self.symbol, image=icon) def parent(self): """Return node's parent node""" return self.parent_node def prev_sib(self): """Return node's previous sibling (the child immediately above it)""" i=self.parent_node.child_nodes.index(self)-1 if i >= 0: return self.parent_node.child_nodes[i] else: return None def next_sib(self): """Return node's next sibling (the child immediately below it)""" i=self.parent_node.child_nodes.index(self)+1 if i < len(self.parent_node.child_nodes): return self.parent_node.child_nodes[i] else: return None def next_visible(self): """Return next lower visible node""" n=self if n.child_nodes: # if you can go right, do so return n.child_nodes[0] while n.parent_node: # move to next sibling i=n.parent_node.child_nodes.index(n)+1 if i < len(n.parent_node.child_nodes): return n.parent_node.child_nodes[i] # if no siblings, move to parent's sibling n=n.parent_node # we're at bottom return self def prev_visible(self): """Return next higher visible node""" n=self if n.parent_node: i=n.parent_node.child_nodes.index(n)-1 if i < 0: return n.parent_node else: j=n.parent_node.child_nodes[i] return j.PVT_last() else: return n def children(self): """Return list of node's children""" return self.child_nodes[:] def get_label(self): """Return string containing text of current label""" return self.widget.itemcget(self.label, 'text') def set_label(self, label): """Set current text label""" self.widget.itemconfig(self.label, text=label) def expanded(self): """Returns true if node is currently expanded, false otherwise""" return self.expanded_flag def expandable(self): """Returns true if node can be expanded (i.e. 
if it's a folder)""" return self.expandable_flag def full_id(self): """Return list of IDs of all parents and node ID""" if self.parent_node: return self.parent_node.full_id()+(self.id,) else: return (self.id,) def expand(self): """Expand node if possible""" if not self.expanded_flag: self.PVT_set_state(1) def collapse(self): """Collapse node if possible""" if self.expanded_flag: self.PVT_set_state(0) def delete(self, me_too=1): """Delete node from tree. ("me_too" is a hack not to be used by external code, please!)""" sw=self.widget if not self.parent_node and me_too: # can't delete the root node raise ValueError, "can't delete root node" self.PVT_delete_subtree() # move everything up so that distance to next subnode is correct n=self.next_visible() x1, y1=sw.coords(self.symbol) x2, y2=sw.coords(n.symbol) if me_too: dist=y2-y1 else: dist=y2-y1-sw.dist_y self.PVT_tag_move(-dist) n=self if me_too: if sw.pos == self: # move cursor if it points to current node sw.move_cursor(self.parent_node) self.PVT_unbind_all() sw.delete(self.symbol) sw.delete(self.label) sw.delete(self.h_line) sw.delete(self.v_line) sw.delete(self.indic) self.parent_node.child_nodes.remove(self) # break circular ref now, so parent may be GC'ed later n=self.parent_node self.parent_node=None n.PVT_cleanup_lines() n.PVT_update_scrollregion() def insert_before(self, nodes): """Insert list of nodes as siblings before this node. Call parent node's add_node() function to generate the list of nodes.""" i=self.parent_node.child_nodes.index(self) self.parent_node.PVT_insert(nodes, i, self.prev_visible()) def insert_after(self, nodes): """Insert list of nodes as siblings after this node. Call parent node's add_node() function to generate the list of nodes.""" i=self.parent_node.child_nodes.index(self)+1 self.parent_node.PVT_insert(nodes, i, self.PVT_last()) def insert_children(self, nodes): """Insert list of nodes as children of this node. Call node's add_node() function to generate the list of nodes.""" self.PVT_insert(nodes, 0, self) def toggle_state(self): """Toggle node's state between expanded and collapsed, if possible""" if self.expandable_flag: if self.expanded_flag: self.PVT_set_state(0) else: self.PVT_set_state(1) # ----- functions for drag'n'drop support ----- def PVT_enter(self, event): """detect mouse hover for drag'n'drop""" self.widget.target=self def dnd_end(self, target, event): """Notification that dnd processing has been ended. It DOES NOT imply that we've been dropped somewhere useful, we could have just been dropped into deep space and nothing happened to any data structures, or it could have been just a plain mouse-click w/o any dragging.""" if not self.widget.drag: # if there's been no dragging, it was just a mouse click self.widget.move_cursor(self) self.toggle_state() self.widget.drag=0 # ----- PRIVATE METHODS (prefixed with "PVT_") ----- # these methods are subject to change, so please try not to use them def PVT_last(self): """Return bottom-most node in subtree""" n=self while n.child_nodes: n=n.child_nodes[-1] return n def PVT_find(self, search): """Used by searching functions""" if self.id != search[0]: # this actually only goes tilt if root doesn't match return None if len(search) == 1: return self # get list of children IDs i=map(lambda x: x.id, self.child_nodes) # if there is a child that matches, search it try: return self.child_nodes[i.index(search[1])].PVT_find(search[1:]) except: return None def PVT_insert(self, nodes, pos, below): """Create and insert new children. 
"nodes" is list previously created via calls to add_list(). "pos" is index in the list of children where the new nodes are inserted. "below" is node which new children should appear immediately below.""" if not self.expandable_flag: raise TypeError, 'not an expandable node' # for speed sw=self.widget # expand and insert children children=[] self.expanded_flag=1 sw.itemconfig(self.symbol, image=self.expanded_icon) if sw.minus_icon and sw.line_flag: sw.itemconfig(self.indic, image=sw.minus_icon) if len(nodes): # move stuff to make room below.PVT_tag_move(sw.dist_y*len(nodes)) # get position of first new child xp, dummy=sw.coords(self.symbol) dummy, yp=sw.coords(below.symbol) xp=xp+sw.dist_x yp=yp+sw.dist_y # create vertical line if sw.line_flag and not self.v_line: self.v_line=sw.create_line( xp, yp, xp, yp+sw.dist_y*len(nodes)) sw.tag_lower(self.v_line, self.symbol) n=sw.node_class for i in nodes: # add new subnodes, they'll draw themselves # this is a very expensive call children.append( n(parent_node=self, expandable_flag=i.flag, label=i.name, id=i.id, collapsed_icon=i.collapsed_icon, expanded_icon=i.expanded_icon, x=xp, y=yp)) yp=yp+sw.dist_y self.child_nodes[pos:pos]=children self.PVT_cleanup_lines() self.PVT_update_scrollregion() sw.move_cursor(sw.pos) def PVT_set_state(self, state): """Common code forexpanding/collapsing folders. It's not re-entrant, and there are certain cases in which we can be called again before we're done, so we use a mutex.""" while self.widget.spinlock: pass self.widget.spinlock=1 # expand & draw our subtrees if state: self.child_nodes=[] self.widget.new_nodes=[] if self.widget.get_contents_callback: # this callback needs to make multiple calls to add_node() try: self.widget.get_contents_callback(self) except: report_callback_exception() self.PVT_insert(self.widget.new_nodes, 0, self) # collapse and delete subtrees else: self.expanded_flag=0 self.widget.itemconfig(self.symbol, image=self.collapsed_icon) if self.indic: self.widget.itemconfig(self.indic, image=self.widget.plus_icon) self.delete(0) # release mutex self.widget.spinlock=0 def PVT_cleanup_lines(self): """Resize connecting lines""" if self.widget.line_flag: n=self while n: if n.child_nodes: x1, y1=self.widget.coords(n.symbol) x2, y2=self.widget.coords(n.child_nodes[-1].symbol) self.widget.coords(n.v_line, x1, y1, x1, y2) n=n.parent_node def PVT_update_scrollregion(self): """Update scroll region for new size""" x1, y1, x2, y2=self.widget.bbox('all') self.widget.configure(scrollregion=(x1, y1, x2+5, y2+5)) def PVT_delete_subtree(self): """Recursively delete subtree & clean up cyclic references to make garbage collection happy""" sw=self.widget sw.delete(self.v_line) self.v_line=None for i in self.child_nodes: # delete node's subtree, if any i.PVT_delete_subtree() i.PVT_unbind_all() # delete widgets from canvas sw.delete(i.symbol) sw.delete(i.label) sw.delete(i.h_line) sw.delete(i.v_line) sw.delete(i.indic) # break circular reference i.parent_node=None # move cursor if it's in deleted subtree if sw.pos in self.child_nodes: sw.move_cursor(self) # now subnodes will be properly garbage collected self.child_nodes=[] def PVT_unbind_all(self): """Unbind callbacks so node gets garbage-collected. This wasn't easy to figure out the proper way to do this. 
See also tag_bind() for the Tree widget itself.""" for j in (self.symbol, self.label, self.indic, self.h_line, self.v_line): for k in self.widget.bindings.get(j, ()): self.widget.tag_unbind(j, k[0], k[1]) def PVT_tag_move(self, dist): """Move everything below current icon, to make room for subtree using the Disney magic of item tags. This is the secret of making everything as fast as it is.""" # mark everything below current node as movable bbox1=self.widget.bbox(self.widget.root.symbol, self.label) bbox2=self.widget.bbox('all') self.widget.dtag('move') self.widget.addtag('move', 'overlapping', bbox2[0], bbox1[3], bbox2[2], bbox2[3]) # untag cursor & node so they don't get moved too self.widget.dtag(self.widget.cursor_box, 'move') self.widget.dtag(self.symbol, 'move') self.widget.dtag(self.label, 'move') # now do the move of all the tagged objects self.widget.move('move', 0, dist) def PVT_click(self, event): """Handle mouse clicks by kicking off possible drag'n'drop processing""" if self.widget.drop_callback: if Tkdnd.dnd_start(self, event): x1, y1, x2, y2=self.widget.bbox(self.symbol) self.x_off=(x1-x2)/2 self.y_off=(y1-y2)/2 else: # no callback, don't bother with drag'n'drop self.widget.drag=0 self.dnd_end(None, None) #------------------------------------------------------------------------------ class Tree(Canvas): # do we have enough possible arguments?!?!?! def __init__(self, master, root_id, root_label='', get_contents_callback=None, dist_x=15, dist_y=15, text_offset=10, line_flag=1, expanded_icon=None, collapsed_icon=None, regular_icon=None, plus_icon=None, minus_icon=None, node_class=Node, drop_callback=None, *args, **kw_args): # pass args to superclass (new idiom from Python 2.2) Canvas.__init__(self, master, *args, **kw_args) # this allows to subclass Node and pass our class in self.node_class=node_class # keep track of node bindings self.bindings={} # cheap mutex spinlock self.spinlock=0 # flag to see if there's been any d&d dragging self.drag=0 # default images (BASE64-encoded GIF files) if expanded_icon == None: self.expanded_icon=PhotoImage( data='R0lGODlhEAANAKIAAAAAAMDAwICAgP//////ADAwMAAAAAAA' \ 'ACH5BAEAAAEALAAAAAAQAA0AAAM6GCrM+jCIQamIbw6ybXNSx3GVB' \ 'YRiygnA534Eq5UlO8jUqLYsquuy0+SXap1CxBHr+HoBjoGndDpNAAA7') else: self.expanded_icon=expanded_icon if collapsed_icon == None: self.collapsed_icon=PhotoImage( data='R0lGODlhDwANAKIAAAAAAMDAwICAgP//////ADAwMAAAAAAA' \ 'ACH5BAEAAAEALAAAAAAPAA0AAAMyGCHM+lAMMoeAT9Jtm5NDKI4Wo' \ 'FXcJphhipanq7Kvu8b1dLc5tcuom2foAQQAyKRSmQAAOw==') else: self.collapsed_icon=collapsed_icon if regular_icon == None: self.regular_icon=PhotoImage( data='R0lGODlhCwAOAJEAAAAAAICAgP///8DAwCH5BAEAAAMALAAA' \ 'AAALAA4AAAIphA+jA+JuVgtUtMQePJlWCgSN9oSTV5lkKQpo2q5W+' \ 'wbzuJrIHgw1WgAAOw==') else: self.regular_icon=regular_icon if plus_icon == None: self.plus_icon=PhotoImage( data='R0lGODdhCQAJAPEAAAAAAH9/f////wAAACwAAAAACQAJAAAC' \ 'FIyPoiu2sJyCyoF7W3hxz850CFIA\nADs=') else: self.plus_icon=plus_icon if minus_icon == None: self.minus_icon=PhotoImage( data='R0lGODdhCQAJAPEAAAAAAH9/f////wAAACwAAAAACQAJAAAC' \ 'EYyPoivG614LAlg7ZZbxoR8UADs=') else: self.minus_icon=minus_icon # horizontal distance that subtrees are indented self.dist_x=dist_x # vertical distance between rows self.dist_y=dist_y # how far to offset text label self.text_offset=text_offset # flag controlling connecting line display self.line_flag=line_flag # called just before subtree expand/collapse self.get_contents_callback=get_contents_callback # called after drag'n'drop 
self.drop_callback=drop_callback # create root node to get the ball rolling self.root=node_class(parent_node=None, label=root_label, id=root_id, expandable_flag=1, collapsed_icon=self.collapsed_icon, expanded_icon=self.expanded_icon, x=dist_x, y=dist_y, parent_widget=self) # configure for scrollbar(s) x1, y1, x2, y2=self.bbox('all') self.configure(scrollregion=(x1, y1, x2+5, y2+5)) # add a cursor self.cursor_box=self.create_rectangle(0, 0, 0, 0) self.move_cursor(self.root) # make it easy to point to control self.bind('', self.PVT_mousefocus) # totally arbitrary yet hopefully intuitive default keybindings # stole 'em from ones used by microsoft tree control # page-up/page-down self.bind('', self.pagedown) self.bind('', self.pageup) # arrow-up/arrow-down self.bind('', self.next) self.bind('', self.prev) # arrow-left/arrow-right self.bind('', self.ascend) # (hold this down and you expand the entire tree) self.bind('', self.descend) # home/end self.bind('', self.first) self.bind('', self.last) # space bar self.bind('', self.toggle) # ----- PRIVATE METHODS (prefixed with "PVT_") ----- # these methods are subject to change, so please try not to use them def PVT_mousefocus(self, event): """Soak up event argument when moused-over""" self.focus_set() # ----- PUBLIC METHODS ----- def tag_bind(self, tag, seq, *args, **kw_args): """Keep track of callback bindings so we can delete them later. I shouldn't have to do this!!!!""" # pass args to superclass func_id=apply(Canvas.tag_bind, (self, tag, seq)+args, kw_args) # save references self.bindings[tag]=self.bindings.get(tag, [])+[(seq, func_id)] def add_list(self, list=None, name=None, id=None, flag=0, expanded_icon=None, collapsed_icon=None): """Add node construction info to list""" n=Struct() n.name=name n.id=id n.flag=flag if collapsed_icon: n.collapsed_icon=collapsed_icon else: if flag: # it's expandable, use closed folder icon n.collapsed_icon=self.collapsed_icon else: # it's not expandable, use regular file icon n.collapsed_icon=self.regular_icon if flag: if expanded_icon: n.expanded_icon=expanded_icon else: n.expanded_icon=self.expanded_icon else: # not expandable, don't need an icon n.expanded_icon=None if list == None: list=[] list.append(n) return list def add_node(self, name=None, id=None, flag=0, expanded_icon=None, collapsed_icon=None): """Add a node during get_contents_callback()""" self.add_list(self.new_nodes, name, id, flag, expanded_icon, collapsed_icon) def find_full_id(self, search): """Search for a node""" return self.root.PVT_find(search) def cursor_node(self, search): """Return node under cursor""" return self.pos def see(self, *items): """Scroll (in a series of nudges) so items are visible""" x1, y1, x2, y2=apply(self.bbox, items) while x2 > self.canvasx(0)+self.winfo_width(): old=self.canvasx(0) self.xview('scroll', 1, 'units') # avoid endless loop if we can't scroll if old == self.canvasx(0): break while y2 > self.canvasy(0)+self.winfo_height(): old=self.canvasy(0) self.yview('scroll', 1, 'units') if old == self.canvasy(0): break # done in this order to ensure upper-left of object is visible while x1 < self.canvasx(0): old=self.canvasx(0) self.xview('scroll', -1, 'units') if old == self.canvasx(0): break while y1 < self.canvasy(0): old=self.canvasy(0) self.yview('scroll', -1, 'units') if old == self.canvasy(0): break def move_cursor(self, node): """Move cursor to node""" self.pos=node x1, y1, x2, y2=self.bbox(node.symbol, node.label) self.coords(self.cursor_box, x1-1, y1-1, x2+1, y2+1) self.see(node.symbol, node.label) def 
toggle(self, event=None): """Expand/collapse subtree""" self.pos.toggle_state() def next(self, event=None): """Move to next lower visible node""" self.move_cursor(self.pos.next_visible()) def prev(self, event=None): """Move to next higher visible node""" self.move_cursor(self.pos.prev_visible()) def ascend(self, event=None): """Move to immediate parent""" if self.pos.parent_node: # move to parent self.move_cursor(self.pos.parent_node) def descend(self, event=None): """Move right, expanding as we go""" if self.pos.expandable_flag: self.pos.expand() if self.pos.child_nodes: # move to first subnode self.move_cursor(self.pos.child_nodes[0]) return # if no subnodes, move to next sibling self.next() def first(self, event=None): """Go to root node""" # move to root node self.move_cursor(self.root) def last(self, event=None): """Go to last visible node""" # move to bottom-most node self.move_cursor(self.root.PVT_last()) def pageup(self, event=None): """Previous page""" n=self.pos j=self.winfo_height()/self.dist_y for i in range(j-3): n=n.prev_visible() self.yview('scroll', -1, 'pages') self.move_cursor(n) def pagedown(self, event=None): """Next page""" n=self.pos j=self.winfo_height()/self.dist_y for i in range(j-3): n=n.next_visible() self.yview('scroll', 1, 'pages') self.move_cursor(n) # ----- functions for drag'n'drop support ----- def where(self, event): """Determine drag location in canvas coordinates. event.x & event.y don't seem to be what we want.""" # where the corner of the canvas is relative to the screen: x_org=self.winfo_rootx() y_org=self.winfo_rooty() # where the pointer is relative to the canvas widget, # including scrolling x=self.canvasx(event.x_root-x_org) y=self.canvasy(event.y_root-y_org) return x, y def dnd_accept(self, source, event): """Accept dnd messages, i.e. 
we're a legit drop target, and we do implement d&d functions.""" self.target=None return self def dnd_enter(self, source, event): """Get ready to drag or drag has entered widget (create drag object)""" # this flag lets us know there's been drag motion self.drag=1 x, y=self.where(event) x1, y1, x2, y2=source.widget.bbox(source.symbol, source.label) dx, dy=x2-x1, y2-y1 # create dragging icon if source.expanded_flag: self.dnd_symbol=self.create_image(x, y, image=source.expanded_icon) else: self.dnd_symbol=self.create_image(x, y, image=source.collapsed_icon) self.dnd_label=self.create_text(x+self.text_offset, y, text=source.get_label(), justify='left', anchor='w') def dnd_motion(self, source, event): """Move drag icon""" self.drag=1 x, y=self.where(event) x1, y1, x2, y2=self.bbox(self.dnd_symbol, self.dnd_label) self.move(self.dnd_symbol, x-x1+source.x_off, y-y1+source.y_off) self.move(self.dnd_label, x-x1+source.x_off, y-y1+source.y_off) def dnd_leave(self, source, event): """Finish dragging or drag has left widget (destroy drag object)""" self.delete(self.dnd_symbol) self.delete(self.dnd_label) def dnd_commit(self, source, event): """Object has been dropped here""" # call our own dnd_leave() to clean up self.dnd_leave(source, event) # process pending events to detect target node # update_idletasks() doesn't do the trick if source & target are # on different widgets self.update() if not self.target: # no target node return # we must update data structures based on the drop if self.drop_callback: try: # called with dragged node and target node # this is where a file manager would move the actual file # it must also move the nodes around as it wishes self.drop_callback(source, self.target) except: report_callback_exception() #------------------------------------------------------------------------------ # the good 'ol test/demo code if __name__ == '__main__': import os import sys # default routine to get contents of subtree # supply this for a different type of app # argument is the node object being expanded # should call add_node() def get_contents(node): path=apply(os.path.join, node.full_id()) for filename in os.listdir(path): full=os.path.join(path, filename) name=filename folder=0 if os.path.isdir(full): # it's a directory folder=1 elif not os.path.isfile(full): # but it's not a file name=name+' (special)' if os.path.islink(full): # it's a link name=name+' (link to '+os.readlink(full)+')' node.widget.add_node(name=name, id=filename, flag=folder) root=Tk() root.title(os.path.basename(sys.argv[0])) tree=os.sep if sys.platform == 'win32': # we could call the root "My Computer" and mess with get_contents() # to return "A:", "B:", "C:", ... etc. 
as it's children, but that # would just be terminally cute and I'd have to shoot myself tree='C:'+os.sep # create the control t=Tree(master=root, root_id=tree, root_label=tree, get_contents_callback=get_contents, width=300) t.grid(row=0, column=0, sticky='nsew') # make expandable root.grid_rowconfigure(0, weight=1) root.grid_columnconfigure(0, weight=1) # add scrollbars sb=Scrollbar(root) sb.grid(row=0, column=1, sticky='ns') t.configure(yscrollcommand=sb.set) sb.configure(command=t.yview) sb=Scrollbar(root, orient=HORIZONTAL) sb.grid(row=1, column=0, sticky='ew') t.configure(xscrollcommand=sb.set) sb.configure(command=t.xview) # must get focus so keys work for demo t.focus_set() # we could do without this, but it's nice and friendly to have Button(root, text='Quit', command=root.quit).grid(row=2, column=0, columnspan=2) # expand out the root t.root.expand() root.mainloop() ================================================ FILE: src/ccg2xml/arabic.ccg ================================================ ############################################################# # # # arabic.ccg # # # ############################################################# # Author: Ben Wing # Date: April 2006 # This is a grammar for a fragment of Arabic. It's particularly # useful for demonstrating the extended use of macros to handle # complicated morphological inflections. # See the `tiny' grammar (tiny.ccg) for more info about the format # of this file. feature { CASE<2>: nom, acc, gen; NUM<2>: sg, du, pl; GEND<2>: m, f; STATE<2>: cons, non-cons {indef, def}; ANIM<2>: hum, nonhum; PERS<2>: 1st, 2nd, 3rd; RESUMPTIVE<2>: nonres, res; SEM-NUM: sg-X, du-X, pl-X; SEM-PERS: 1st-X, 2nd-X, 3rd-X; TENSE: past, pres; MOOD: indic, subj, juss; # Here's a more complicated hierarchy, from the original tiny grammar. ontology: sem-obj { phys-obj { animate-being { person }, thing }, situation { change { action }, state } }; } rule { no typeraise; typeraise +: n => s; typeraise - $: n => s; typeraise - $: pp => s; typeraise - $: pp/n => s; typechange: s$1 | n[nom] => s$1 ; typechange: n<~2>[cons] => n<2>[3rd,def] /* n[gen,def] ; typechange: n<~2>[cons] => n<2>[3rd,indef] /* n[gen,indef] ; } ########################################################################## # Morphological entries # # (morph.xml) # ########################################################################## word wa:Conj; # "and" word anna:Comp; # "that", introducing sentential complements word inna:Comp; # same, but only after the verb qaal "say" word maa:InterrogPro(thing): 3rd; # "what" word man:InterrogPro(person): 3rd; # "who" word li:Prep; # "what" word fii:Prep; # "who" # This word means "this". word haadhaa { *: sg, m; haadhihi: sg, f; ha_ulaahi: pl; # Bizarrely, this word declines for case only in the dual. haadhaani: du, m, nom; haadhayni: du, m, acc; haadhayni: du, m, gen; haataani: du, f, nom; haatayni: du, f, acc; haatayni: du, f, gen; } # This word means "that". word dhaalik { *: sg, m; tilka: sg, f; ulaa_ika: pl; # Bizarrely, this word declines for case only in the dual. dhaanika: du, m, nom; dhaynika: du, m, acc; dhaynika: du, m, gen; taanika: du, f, nom; taynika: du, f, acc; taynika: du, f, gen; } # This is the relative pronoun. word al-ladhii { *: sg, m; al-latii: sg, f; al-ladhiina: pl, m; al-laati: pl, f; # Bizarrely, this word declines for case only in the dual. 
al-ladhaani: du, m, nom; al-ladhayni: du, m, acc; al-ladhayni: du, m, gen; al-lataani: du, f, nom; al-latayni: du, f, acc; al-latayni: du, f, gen; } word pro:Pro { ana: 1st, 1st-X, sg, sg-X; anta: 2nd, 2nd-X, sg, sg-X, m; anti: 2nd, 2nd-X, sg, sg-X, f; huwa: 3rd, 3rd-X, sg, sg-X, m; hiya: 3rd, 3rd-X, sg, sg-X, f; naHnu: 1st, 1st-X, pl, pl-X; antun: 2nd, 2nd-X, pl, pl-X, m; antunna: 2nd, 2nd-X, pl, pl-X, f; hum: 3rd, 3rd-X, pl, pl-X, m; hunna: 3rd, 3rd-X, pl, pl-X, f; } word ii:: 1st, 1st-X, sg, sg-X; word nii:: 1st, 1st-X, sg, sg-X; word ka:: 2nd, 2nd-X, sg, sg-X, m; word ki:: 2nd, 2nd-X, sg, sg-X, f; word hu:: 3rd, 3rd-X, sg, sg-X, m; word haa:: 3rd, 3rd-X, sg, sg-X, f; word naa:: 1st, 1st-X, pl, pl-X; word kum:: 2nd, 2nd-X, pl, pl-X, m; word kunna:: 2nd, 2nd-X, pl, pl-X, f; word hum:: 3rd, 3rd-X, pl, pl-X, m; word hunna:: 3rd, 3rd-X, pl, pl-X, f; ############################################# # Nouns # ############################################# # This shows how a reasonably complicated morphology can be accommodated. # It is certainly possible that some of this may (and probably should) # be offloaded into a separate morphology-processing engine. However, # even in that case there is often a good deal more to the lexicon. # We show a couple examples of complete paradigms, in order to make it # easier to understand what's going on below. # Here is a typical noun (kitaab "book") with a broken plural (kutub "books"). # For nouns with broken plurals, the plural is typically declined like # the singular. Note that Arabic nouns are conjugated for three numbers # (singular, dual, plural), three cases (nominative, accusative, dative), # and three states (indefinite, definite, construct). (The construct state # is used for nouns that are modified by other nouns -- e.g. "book" in # "the book of Mary".) # Form Nominative Accusative Dative # --------------------------------------------------------------- # sg.indef kitaabun kitaaban kitaabin # sg.def al-kitaabu al-kitaaba al-kitaabi # sg.cons kitaabu kitaaba kitaabi # # du.indef kitaabaani kitaabayni kitaabayni # du.def al-kitaabaani al-kitaabayni al-kitaabayni # du.cons kitaabaa kitaabay kitaabay # # pl.indef kutubun kutuban kutubin # pl.def al-kutubu al-kutuba al-kutubi # pl.cons kutubu kutuba kutubi # Here is a typical noun (mudarris "teacher") with a different kind of # plural, a so-called "strong masculine plural", which has its own declension. # Form Nominative Accusative Dative # --------------------------------------------------------------- # sg.indef mudarrisun mudarrisan mudarrisin # sg.def al-mudarrisu al-mudarrisa al-mudarrisi # sg.cons mudarrisu mudarrisa mudarrisi # # du.indef mudarrisaani mudarrisayni mudarrisayni # du.def al-mudarrisaani al-mudarrisayni al-mudarrisayni # du.cons mudarrisaa mudarrisay mudarrisay # # pl.indef mudarrisuuna mudarrisiina mudarrisiina # pl.def al-mudarrisuuna al-mudarrisiina al-mudarrisiina # pl.cons mudarrisuu mudarrisii mudarrisii # Here, we make heavy use of macros. # This macro says: Every time an expression of the form # three-form-decl(...) occurs, replace it with the text that comes after. # The parameters will be substituted into the text. The braces that # denote the macro's text do *NOT* form part of the text that is substituted. # Note that macro substitutions are processed recursively: If the text # of a macro substitution contains calls to other macros, they will also # be processed. This makes "inheritance" very easy to implement. 
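# To make the substitution mechanism concrete, here is a tiny, purely
# illustrative macro (it is NOT part of this grammar; the name and the
# forms are invented just for the example):
#
#   def nom-acc(form) {
#     form.u: nom;
#     form.a: acc;
#   }
#
# A later call nom-acc(kitaab) would be replaced, before parsing proper,
# by the two entries
#
#   kitaabu: nom;
#   kitaaba: acc;
#
# The "." operator glues the argument and the suffix into one form, and
# because expansion is recursive, the replacement text may itself call
# other macros -- which is exactly how the declension macros below are
# layered on top of one another.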
# This macro is used for a particular paradigm corresponding to a # particular number of a word. def three-different-form-decl(indef-form, def-form, cons-form, indef-nom, indef-acc, indef-gen, def-nom, def-acc, def-gen, cons-nom, cons-acc, cons-gen, morph-num, sem-num, gend) { indef-form.indef-nom: morph-num, sem-num, gend, nom, indef; indef-form.indef-acc: morph-num, sem-num, gend, acc, indef; indef-form.indef-gen: morph-num, sem-num, gend, gen, indef; add-al(def-form.def-nom): morph-num, sem-num, gend, nom, def; add-al(def-form.def-acc): morph-num, sem-num, gend, acc, def; add-al(def-form.def-gen): morph-num, sem-num, gend, gen, def; cons-form.cons-nom: morph-num, sem-num, gend, nom, cons; cons-form.cons-acc: morph-num, sem-num, gend, acc, cons; cons-form.cons-gen: morph-num, sem-num, gend, gen, cons; } # It's questionable whether we should do this. This assimilates al- # to a following coronal consonant, e.g. ar-rajul, as-sigaara, # ath-thalj, an-nuur, aDH-DHuhr, etc. def add-al(form) regsub('^al-([std]h|DH|[tdszrnTDSZL])', 'a\1-\1', al-.form) def three-form-decl(form, indef-nom, indef-acc, indef-gen, def-nom, def-acc, def-gen, cons-nom, cons-acc, cons-gen, morph-num, sem-num, gend) { three-different-form-decl(form, form, form, indef-nom, indef-acc, indef-gen, def-nom, def-acc, def-gen, cons-nom, cons-acc, cons-gen, morph-num, sem-num, gend) } # Using the above macro, we create two more macros to handle two common # paradigm types: Accusative and genitive are the same, and the # definite is either the same as the construct (two-form-decl-1) or # the same as the indefinite (two-form-decl-2). def two-form-decl-1(form, non-cons-nom, non-cons-obl, cons-nom, cons-obl, morph-num, sem-num, gend) { three-form-decl(form, non-cons-nom, non-cons-obl, non-cons-obl, non-cons-nom, non-cons-obl, non-cons-obl, cons-nom, cons-obl, cons-obl, morph-num, sem-num, gend) } def two-form-decl-2(form, indef-nom, indef-obl, non-indef-nom, non-indef-obl, morph-num, sem-num, gend) { three-form-decl(form, indef-nom, indef-obl, indef-obl, non-indef-nom, non-indef-obl, non-indef-obl, non-indef-nom, non-indef-obl, non-indef-obl, morph-num, sem-num, gend) } # In turn we create macros for particular paradigms: strong masculine ("uun"), # strong feminine ("aat"), dual, and basic triptote (the paradigm for # "kitaab" above and, in general, most singulars). # Note that an alternative to using braces is to put the macro text on # the same line as the `def' part of the macro (backslashes can be used # to join multiple lines together). def uun-plural(form) two-form-decl-1(form, uuna, iina, uu, ii, pl, pl-X, m) def aat-plural(form) \ two-form-decl-2(form, aatun, aatin, aatu, aati, pl, pl-X, f) def dual(form, gend) \ two-form-decl-1(form, aani, ayni, aa, ay, du, du-X, gend) def triptote(form, morph-num, sem-num, gend) \ three-form-decl(form, un, an, in, u, a, i, u, a, i, morph-num, sem-num, gend) # Here we define macros for full paradigms for words. Note how semicolons # are not used, because they are supplied by the macro text itself. # (Consult the text for three-form-decl() above, and remember that the # braces denoting the macro text are not actually part of the text. This # means that if you really want braces as the outermost thing in some # macro text, you'll need to supply two levels of braces.) 
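# As a rough sanity check on the machinery above (an illustrative
# expansion only, not additional entries): a call such as
# triptote(kitaab, sg, sg-X, m) passes through three-form-decl and
# three-different-form-decl and comes out as the nine singular entries
# of the kitaab table given earlier, roughly
#
#   kitaabun: sg, sg-X, m, nom, indef;
#   kitaaban: sg, sg-X, m, acc, indef;
#   kitaabin: sg, sg-X, m, gen, indef;
#   al-kitaabu: sg, sg-X, m, nom, def;
#   al-kitaaba: sg, sg-X, m, acc, def;
#   al-kitaabi: sg, sg-X, m, gen, def;
#   kitaabu: sg, sg-X, m, nom, cons;
#   kitaaba: sg, sg-X, m, acc, cons;
#   kitaabi: sg, sg-X, m, gen, cons;
#
# with the definite forms produced via add-al(). Since /k/ is not a
# coronal consonant the prefix stays al-; a stem like rajul would instead
# come out as ar-rajulu (compare the testbed sentences at the end of
# this file).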
def thing(sing, plur) { word sing:N(thing) { triptote(sing, sg, sg-X, m) dual(sing, m) triptote(plur, sg, pl-X, f) } } def fem-thing(sing, plur) { word sing:N(thing) { triptote(sing.t, sg, sg-X, f) dual(sing.t, f) triptote(plur, sg, pl-X, f) } } def person(sing, plur, gend) { word sing:N(person) { triptote(sing, sg, sg-X, gend) dual(sing, gend) triptote(plur, pl, pl-X, gend) } } def male(sing, plur) person(sing, plur, m) def female(sing, plur) person(sing, plur, f) def strong-male(sing) { word sing:N(person) { triptote(sing, sg, sg-X, m) dual(sing, m) uun-plural(sing) } } # Here we define the actual words. Note how short these definitions are, # specifying only what's unpredictable. thing(kitaab, kutub) thing(waqt, _awqaat) thing(Harf, Huruuf) thing(dars, duruus) thing(waqt, _awqaat) fem-thing(sigaara, sagaayir) fem-thing(madiina, mudun) male(rajul, rijaal) male(walad, _awlaad) male(Taalib, Tullaab) female(bint, _abnaat) strong-male(mudarris) word imra_a:N(person) { three-different-form-decl(imra_at, mar_at, imra_at, un, an, in, u, a, i, u, a, i, sg, sg-X, f) three-different-form-decl(imra_at, mar_at, imra_at, aani, ayni, ayni, aani, ayni, ayni, aa, ay, ay, du, du-X, f) triptote(nisaa_, pl, pl-X, f) } def extended_construct_word(stem, plur) { word stem:N(person) { three-form-decl(stem, un, an, in, u, a, i, uu, aa, ii, sg, sg-X, m) dual(stem, m) triptote(plur, pl, pl-X, m) } } extended_construct_word(_ax, _ixwaan) extended_construct_word(_ab, _abnaa_) # Typical paradigms: # 1sg 'aktaa 'aktaa 'akta | # 2sg.m taktaa taktaa takta | # 2sg.f taktayna taktay taktay | # 3sg.m yaktaa yaktaa yakta | # 3sg.f taktaa taktaa takta | # 2du taktayaani taktayaa taktayaa | # 3du.m yaktayaani yaktayaa yaktayaa | # 3du.f taktayaani taktayaa taktayaa | # 1pl naktaa naktaa nakta | # 2pl.m taktawna taktaw taktaw | # 2pl.f taktayna taktayna taktayna | # 3pl.m yaktawna yaktaw yaktaw | # 3pl.f yaktayna yaktayna yaktayna | # # 1sg 'aktuu 'aktuwa 'aktu | 'aktii 'aktiya 'akti # 2sg.m taktuu taktuwa taktu | taktii taktiya takti # 2sg.f taktiina taktii taktii | taktiina taktii taktii # 3sg.m yaktuu yaktuwa yaktu | yaktii yaktiya yakti # 3sg.f taktuu taktuwa taktu | taktii taktiya takti # 2du taktuwaani taktuwaa taktuwaa | taktiyaani taktiyaa taktiyaa # 3du.m yaktuwaani yaktuwaa yaktuwaa | yaktiyaani yaktiyaa yaktiyaa # 3du.f taktuwaani taktuwaa taktuwaa | taktiyaani taktiyaa taktiyaa # 1pl naktuu naktuwa naktu | naktii naktiya nakti # 2pl.m taktuuna taktuu taktuu | taktuuna taktuu taktuu # 2pl.f taktuuna taktuuna taktuuna | taktiina taktiina taktiina # 3pl.m yaktuuna yaktuu yaktuu | yaktuuna yaktuu yaktuu # 3pl.f yaktuuna yaktuuna yaktuuna | yaktiina yaktiina yaktiina def two-form-past(formv, formc) { formc.tu: past, 1st, sg; formc.ta: past, 2nd, m, sg; formc.ti: past, 2nd, f, sg; formv.a: past, 3rd, m, sg; formv.at: past, 3rd, f, sg; formc.tumaa: past, 2nd, du; formv.aa: past, 3rd, m, du; formv.ataa: past, 3rd, f, du; formc.naa: past, 1st, pl; formc.tum: past, 2nd, m, pl; formc.tunna: past, 2nd, f, pl; formv.uu: past, 3rd, m, pl; formc.na: past, 3rd, f, pl; } def 3rd-weak-past-ay(form) { form.ay.tu: past, 1st, sg; form.ay.ta: past, 2nd, m, sg; form.ay.ti: past, 2nd, f, sg; form.aa: past, 3rd, m, sg; form.at: past, 3rd, f, sg; form.ay.tumaa: past, 2nd, du; form.ay.aa: past, 3rd, m, du; form.ataa: past, 3rd, f, du; form.ay.naa: past, 1st, pl; form.ay.tum: past, 2nd, m, pl; form.ay.tunna: past, 2nd, f, pl; form.aw: past, 3rd, m, pl; form.ay.na: past, 3rd, f, pl; } def 3rd-weak-past-aw(form) { form.aw.tu: past, 1st, sg; 
form.aw.ta: past, 2nd, m, sg; form.aw.ti: past, 2nd, f, sg; form.aa: past, 3rd, m, sg; form.at: past, 3rd, f, sg; form.aw.tumaa: past, 2nd, du; form.aw.aa: past, 3rd, m, du; form.ataa: past, 3rd, f, du; form.aw.naa: past, 1st, pl; form.aw.tum: past, 2nd, m, pl; form.aw.tunna: past, 2nd, f, pl; form.aw: past, 3rd, m, pl; form.aw.na: past, 3rd, f, pl; } def 3rd-weak-past-ii(form) { form.ii.tu: past, 1st, sg; form.ii.ta: past, 2nd, m, sg; form.ii.ti: past, 2nd, f, sg; form.iya: past, 3rd, m, sg; form.iyat: past, 3rd, f, sg; form.ii.tumaa: past, 2nd, du; form.iy.aa: past, 3rd, m, du; form.iy.ataa: past, 3rd, f, du; form.ii.naa: past, 1st, pl; form.ii.tum: past, 2nd, m, pl; form.ii.tunna: past, 2nd, f, pl; form.uu: past, 3rd, m, pl; form.ii.na: past, 3rd, f, pl; } def strong-past(form) two-form-past(form, form) # In general, almost all Arabic present-tense verbs of a particular mood # can be defined using five forms. Verbs with a hamza in the first radical # have a problem in the first-singular; ideally this should be handled # automatically using a regexp or something of that sort, but we don't have # such support currently, so we use an optional param. def gen-pres(mood, fsing, fsing-fem, fdual, fplur-masc, fplur-fem) { # This shows how you can use regular expressions if need be. # regsub(string, regex, repl) is a special built-in that does regular- # expression substitution on STRING, replacing all occurrences of # REGEX with REPL. Regular-expression syntax is as in Python. # In this case, Arabic verbs have a phonetic rule that eliminates # two glottal stops occurring near each other at the beginning of a # word. For example, _a_kulu -> _aakulu, and _u_kalu -> _uukalu. # (That is, the vowel is lengthened.) # _ . regsub(foo, bar, fsing): pres, mood, 1st, sg; _ . regsub('^([aiu])_', '\1\1', fsing): pres, mood, 1st, sg; # _.fsing: pres, mood, 1st, sg; t.fsing: pres, mood, 2nd, m, sg; t.fsing-fem: pres, mood, 2nd, f, sg; y.fsing: pres, mood, 3rd, m, sg; t.fsing: pres, mood, 3rd, f, sg; t.fdual: pres, mood, 2nd, du; y.fdual: pres, mood, 3rd, m, du; t.fdual: pres, mood, 3rd, f, du; n.fsing: pres, mood, 1st, pl; t.fplur-masc: pres, mood, 2nd, m, pl; t.fplur-fem: pres, mood, 2nd, f, pl; y.fplur-masc: pres, mood, 3rd, m, pl; y.fplur-fem: pres, mood, 3rd, f, pl; } # The "two-form" present uses normal (non-3rd-weak) endings but may # have two forms of the root, one form vocalic endings (almost all of them) # and one for consonant endings (only the feminine plural). This # encompasses 2nd-weak verbs and doubled verbs, and (trivially) strong verbs. def two-form-pres-indic(formv, formc) { gen-pres(indic, formv.u, formv.iina, formv.aani, formv.uuna, formc.na) } def two-form-pres-subj(formv, formc) { gen-pres(subj, formv.a, formv.ii, formv.aa, formv.uu, formc.na) } # The jussive is different because the base form (fsing) has no ending. # This means that it may assume the consonant form instead of the vowel # form, or may have a number of variants (in particular, for doubled # verbs). So the base form needs to be given explicitly. 
def two-form-pres-juss(base, formv, formc) { gen-pres(juss, base, formv.ii, formv.aa, formv.uu, formc.na) } def strong-pres(form) { two-form-pres-indic(form, form) two-form-pres-subj(form, form) two-form-pres-juss(form, form, form) } def 2nd-weak-pres(formv, formc) { two-form-pres-indic(formv, formc) two-form-pres-subj(formv, formc) two-form-pres-juss(formc, formv, formc) } def doubled-pres(formv, formc) { two-form-pres-indic(formv, formc) two-form-pres-subj(formv, formc) two-form-pres-juss(formc, formv, formc) two-form-pres-juss(formv.a, formv, formc) two-form-pres-juss(formv.i, formv, formc) } # Verbs whose third radical is a /w/ or a /y/ have all manner of exceptional # forms; easiest just to list them. In general, there are three types, # depending on whether the base singular forms end in -aa, -ii, or -uu. def 3rd-weak-pres-aa(form) { gen-pres(indic, form.aa, form.ayna, form.ayaani, form.awna, form.ayna) gen-pres(subj, form.aa, form.ay, form.ayaa, form.aw, form.ayna) # Note the shortened vowel here. gen-pres(juss, form.a, form.ay, form.ayaa, form.aw, form.ayna) } def 3rd-weak-pres-ii(form) { gen-pres(indic, form.ii, form.iina, form.iyaani, form.uuna, form.iina) gen-pres(subj, form.iya, form.ii, form.iyaa, form.uu, form.iina) # Note the shortened vowel here. gen-pres(juss, form.i, form.ii, form.iyaa, form.uu, form.iina) } def 3rd-weak-pres-uu(form) { gen-pres(indic, form.uu, form.iina, form.uwaani, form.uuna, form.uuna) gen-pres(subj, form.uwa, form.ii, form.uwaa, form.uu, form.uuna) # Note the shortened vowel here. gen-pres(juss, form.u, form.ii, form.uwaa, form.uu, form.uuna) } def 2nd-weak-verb(pastv, props, pastc, presv, presc) { word pastv: props { two-form-past(pastv, pastc) 2nd-weak-pres(presv, presc) } } # Note the way that macro calls can be constructed as well. Here, the # value of PAST_TYPE is the suffix at the end of the macro name. def 3rd-weak-verb(past_stem, props, past_type, pres_stem, pres_type) { word past_stem . past_type: props { 3rd-weak-past- . past_type(past_stem) 3rd-weak-pres- . pres_type(pres_stem) } } def strong-verb(past, props, pres) { word past: props { strong-past(past) strong-pres(pres) } } 2nd-weak-verb(kaan, TransV(pred=be), kun, akuun, akun) 2nd-weak-verb(naam, IntransV(pred=sleep), nim, anaam, anam) 2nd-weak-verb(qaal, SayV(pred=say), qul, aquul, aqul) strong-verb(katab, TransV(pred=write), aktub) strong-verb(dhahab, IntransV(pred=go), adhhab) # Note that the following verb, which begins with a glottal stop, # will have a modification made to it in the first-person singular present. # (See above.) 
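# (A rough trace of that modification, for illustration only: for the
# present stem a_kul used just below, gen-pres builds the 1sg indicative
# as _ . regsub('^([aiu])_', '\1\1', a_kul.u); the regsub rewrites
# "a_kulu" to "aakulu", so the surface form comes out as _aakulu rather
# than *_a_kulu -- exactly the vowel lengthening described for gen-pres
# above.)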
strong-verb(_akal, IntransV TransV (pred=eat), a_kul) 3rd-weak-verb(ra_, TransV(pred=see), ay, ar, aa) 3rd-weak-verb(_a9T, DitransV(pred=give), ay, u9T, ii) 3rd-weak-verb(laq, TransV(pred=find), ii, alq, aa) strong-verb(9araf, ThinkV(pred=know), a9rif) # see also 9alam strong-verb(tafakkar, ThinkV(pred=think), atafakkar) strong-verb(ta9allam, ThinkV(pred=learn), ata9allam) family N { entry: n<2>[X, 3rd, nonres]: X:sem-obj(*); } family InterrogPro(Pro) { entry: s/*(s/n<2>[res]); entry: s/*(s|n<2>[nonres,nom]); entry: s/*(s/n<2>[nonres,acc]); member: maa, man; } family Pro { entry: n<2>[X, nom, def, nonres]: X:sem-obj(*); member: pro; } family Rel { entry: (n<~2>[CASE,nonres]\n<~2>[nonres])/*(s/n<2>[res]); entry: (n<~2>[CASE,nonres]\n<~2>[nonres])/*(s|n<2>[nonres,nom]); entry: (n<~2>[CASE,nonres]\n<~2>[nonres])/*(s/n<2>[nonres,acc]); member: al-ladhii; } family AndConj(Conj) { entry: n[pl, CASE, STATE] \* n[CASE, STATE] /* n[CASE, STATE]; entry: s$1 \* s$1 /* s$1; member: wa; } family Det(indexRel=det) { entry: n<2>[X, def, nonres] /^ n<2>[X]: X:sem-obj(*); member: haadhaa, dhaalik; } # good luck on this one! construct even more complicated ones! # #ar-rajulu al-ladhii kataba al-kutuba ra_aa wa _a9Taa li binti hu al-kilaaba al-latii akalat sagaayira mudarrisii al-waladi #"the man that wrote the books saw and gave to his daughter the dogs that ate the cigarettes of the boy's teachers." # Works, correctly: #ar-rajulu al-ladhii kataba al-kutuba ra_aa wa _a9Taa li binti hu as-sagaayira al-latii qultu inna al-waladu tafakkara anna al-mar_atu _a9Tat haa li ha_ulaahi al-mudarrisiina #Bad #ar-rajula al-ladhii katabat al-kutuba ra_aa wa _a9Taa li binti hu as-sagaayira al-latii qultu inna al-waladu tafakkara anna al-mar_atu _a9Tat haa li ha_ulaahi al-mudarrisiina #"the man that wrote the books saw and gave to his daughter the cigarettes that I said that the boy thought that the woman gave them to those teachers" # Fails, correctly: #ar-rajulu al-ladhii kataba al-kutuba ra_aa wa _a9Taa li binti hu as-sagaayira al-latii qultu inna al-waladu tafakkara anna al-mar_atu _a9Tat hu li ha-ulaahi al-mudarrisiina # Works: # ar-rajulu al-ladhii al-waladu _a9Taa as-sagaayira li binti hu dhahaba # ar-rajulu _a9Taa li binti hu as-sagaayira # ar-rajulu al-ladhii waladu hu _a9Taa as-sagaayira li al-binti dhahaba # Won't work: # ar-rajulu al-ladhii al-waladu _a9Taa li binti hu as-sagaayira dhahaba # ar-rajulu al-ladhii waladu hu _a9Taa li al-binti as-sagaayira dhahaba family PossClitic(Cli, indexRel=poss) { entry: n<~1>[X, def, nonres] \* n<1>[X, cons]: X:sem-obj(*); entry: (n<~1>[X, def, nonres] / n<2>[res]) \* n<1>[X, cons]: X:sem-obj(*); member: ii, ka, ki, hu, haa, naa, kum, kunna, hum, hunna; } family ObjClitic(Cli, indexRel=poss) { entry: (s$1 | n<3>[nonres]) \ (s$1 / n<2>[nonres] | n<3>[nom,nonres]); entry: (s$1 / n<~2>[res] | n<3>[nonres]) \ (s$1 / n<2>[nonres] | n<3>[nom,nonres]); member: nii, ka, ki, hu, haa, naa, kum, kunna, hum, hunna; } family Adj(indexRel=adj) { entry: n<2>[X, NUM, GEND, CASE, STATE] \ n<2>[X]: X:sem-obj(*); } family Prep-Nom(Prep, indexRel="*NoSem*") { # The pp<~3> notation generates an 'inheritsFrom' tag rather than # an 'id' tag for the feature structure. 
entry: pp<~3>[lex=*] /< n<3>[gen,nonres]; member: li, fii; } family Comp(indexRel="*NoSem*") { entry: sbar<~1>[lex=*] / s<1>; member: anna, inna; } family IntransV(V) { entry: s[E] | n<2>[X,NUM,PERS,GEND,non-cons,nonres,nom]: E:action(* ^ X:animate-being); } family SayV(V) { entry: s[E] / sbar[Z, lex=inna] | n<2>[X,NUM,PERS,GEND,non-cons,nonres,nom]: E:action(* ^ X:animate-being ^ Z); } family ThinkV(V) { entry: s[E] / sbar[Z, lex=anna] | n<2>[X,NUM,PERS,GEND,non-cons,nonres,nom]: E:action(* ^ X:animate-being ^ Z); } family TransV(V) { entry: s[E] / n[Y,acc,nonres] | n<2>[X,NUM,PERS,GEND,non-cons,nonres,nom]: E:action(* ^ X:animate-being ^ Y:sem-obj); } family DitransV(V) { # The first slash (on the pp) is marked with a mode allowing backward xcomp. entry: s[E] /< pp[Z,lex=li] / n[Y,acc,nonres] | n<2>[X,NUM,PERS,GEND,non-cons,nonres,nom]: E:action(* ^ X:animate-being ^ Y:sem-obj ^ Z:animate-being) ; } testbed { # different states of subject rajulun dhahaba: 1; ar-rajulu dhahaba: 1; rajulu dhahaba: 0; # subject-verb agreement rajulun dhahabuu: 0; ar-rajulu dhahabuu: 0; rajulu dhahabuu: 0; # gender agreement ar-rajulu dhahaba: 1; ar-rajulu dhahabat: 0; al-bintu dhahaba: 0; al-bintu dhahabat: 1; # possession rajulun hu dhahaba: 0; ar-rajulu hu dhahaba: 0; rajulu hu dhahaba: 1; # subject case ar-rajula dhahaba: 0; ar-rajuli dhahaba: 0; # case in construct phrase _axuu ar-rajuli dhahaba: 1; _axuu ar-rajula dhahaba: 0; _axuu ar-rajulu dhahaba: 0; # construct state in construct phrase _axun ar-rajuli dhahaba: 0; al-_axu ar-rajuli dhahaba: 0; # object case ar-rajulu ra_aa al-kitaaba: 1; ar-rajulu ra_aa al-kitaabi: 0; ar-rajulu ra_aa al-kitaabu: 0; # preposition case ar-rajulu _a9Taa al-kitaaba li al-waladi: 1; ar-rajulu _a9Taa al-kitaaba li al-waladu: 0; ar-rajulu _a9Taa al-kitaaba li al-walada: 0; # subcategorization ar-rajulu ra_aa al-kitaaba li al-waladi: 0; # backward xcomp ar-rajulu _a9Taa li al-waladi al-kitaaba: 1; _a9Taa ar-rajulu li al-waladi al-kitaaba: 1; # object clitics ana ra_aytu hu: 1; ra_aytu hu ana: 1; ra_aytu ana hu: 0; hu ra_aytu ana: 0; hu ana ra_aytu: 0; huwa ra_aa nii: 1; huwa ra_aa ii: 0; huwa ra_aa ana: 0; ar-rajulu _a9Taa haa li al-waladi: 1; _a9Taa haa ar-rajulu li al-waladi: 1; # relative clauses # "I gave it to the man that the girl saw him" _a9Taytu haa li ar-rajuli al-ladhii al-bintu ra_at hu: 3; # "I gave it to the man that the girl saw her" _a9Taytu haa li ar-rajuli al-ladhii al-bintu ra_at haa: 0; # "I gave it to the man that the girl saw" _a9Taytu haa li ar-rajuli al-ladhii al-bintu ra_at: 0; # "I gave it to the man that the girl saw the boy" _a9Taytu haa li ar-rajuli al-ladhii al-bintu ra_at al-walada: 0; } ================================================ FILE: src/ccg2xml/build.xml ================================================ ================================================ FILE: src/ccg2xml/ccg.ply ================================================ # Author: Ben Wing # Date: November 2006 ############################################################################# # # # ccg.ply # # # # Convert a .ccg file, specifying a CCG grammar, into files lexicon.xml, # # rules.xml, morph.xml, types.xml and grammar.xml. You can't actually # # run this file itself; you have to use convert-ply.py to convert it # # into a Python file (ccg2xml), which you then run to generate the XML # # files from the .ccg input. For a description of the format of this # # file, see the comments in convert-ply.py. 
# # # ############################################################################# import sys import re import optparse import copy import os import cStringIO # Local imports import lex, yacc # Get options usage = """%prog [OPTIONS] FILE ... Generate appropriate XML files for input to OpenCCG. """ parser = optparse.OptionParser(usage=usage) parser.add_option("-o", "--omit-output", help="""Omit the specified files from the output. Value should be a list separated by commas or spaces. The allowed values are grammar, morph, lexicon, rules, types, and testbed. If you put a + sign before the list, it means output *only* the specified files.""" ) parser.add_option("-p", "--prefix", help="""Optional prefix to attach to each of the generated files, so that output from different files can occur in the same directory. Defaults to the base name of the input file, minus any extension, plus a hyphen. If you want such a hyphen or similar char, add it yourself.""", metavar="DIR" ) parser.add_option("-d", "--dir", help="""Directory to store files in (defaults to current directory).""", metavar="DIR" ) parser.add_option("-q", "--quiet", action="store_true", help="Don't output explanatory messages, but only warnings and errors.") parser.add_option("-t", "--transformed-input", action="store_true", help="Output transformed input after macro substitutions have been applied.") parser.add_option("-y", "--yacc-debug", action="store_true", help="Show more output about the YACC parser generation. Also probably generate some extra files, e.g. parser.out, containing info about the generated parser.") parser.add_option("-m", "--macro-debug", action="store_true", help="Dump macro definitions at end of file.") parser.add_option("--super-macro-debug", action="store_true", help="Show copious output about macro expansions.") def parse_arguments(argv): global options, global_args (options, global_args) = parser.parse_args(argv) # Global variables used for debugging; we may move them into the # global-state variable global lex_debug global xml_debug global yacc_debug global macro_debug global super_macro_debug lex_debug = 0 xml_debug = 0 yacc_debug = options.yacc_debug macro_debug = options.macro_debug super_macro_debug = options.super_macro_debug ######################################################################## # Utility functions # ######################################################################## # CONVENTIONS: # # --------- XML ---------- # # Thankfully, the structure of XML is extremely simple. We represent # a single XML statement of the form # # # # ... # gurgle # # # as a list # # ['biteme', [('foo', '1'), ('blorp', 'baz')], # ['bitemetoo', ...], # 'gurgle' # ] # # i.e. an XML statement corresponds to a list where the first element # is the statement name, the second element lists any properties, and # the remaining elements list items inside the statement. # # ----------- Property lists ------------- # # The second element of an XML statement in list form is a "property list", # a list of two-element tuples (property and value). Some functions below # (e.g. `getprop', `putprop') manipulate property lists. # # FIXME: Just use a hash table. # # ---------- Abstract syntax trees ----------- # # We use classes to represent statements and blocks. Below this level, it's # simpler to just use the XML that we ultimately have to generate anyway. # The conventions for using XML are either to use property lists or lists of # XML statements in the list form outlined above. 
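# To make the list form above concrete (an illustrative value only; the
# element and attribute names are arbitrary), a nested list such as
#
#   ['biteme', [('foo', '1'), ('blorp', 'baz')],
#       ['bitemetoo', [('x', 'y')]],
#       'gurgle']
#
# is rendered by print_xml() below as XML along the lines of
#
#   <biteme foo="1" blorp="baz">
#     <bitemetoo x="y"/>
#     gurgle
#   </biteme>
#
# i.e. the element name comes first, then the property list of
# (attribute, value) pairs, then any child statements or literal text;
# elements with no children are emitted in self-closing form.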
############################# # Handling XML # ############################# def xml_sub(crap): if type(crap) is not str: crap = str(crap) crap = crap.replace('<', '<') crap = crap.replace('>', '>') return crap def print_xml_1(file, xml, indent=0): if xml_debug > 1: errout("%sPrinting: %s\n" % (' ' * indent, str(xml))) if type(xml) is not list: file.write('%s%s\n' % (' ' * indent, xml_sub(xml))) else: check_arg_type("XML statement", xml[0], str) file.write(' ' * indent) file.write('<%s' % xml_sub(xml[0])) for x in xml[1]: check_arg_type("XML statement", x, tuple) if len(x) != 2: raise TypeError("Bad tuple pair: " + str(x)) file.write(' %s="%s"' % (xml_sub(x[0]), xml_sub(x[1]))) subargs = xml[2:] if not subargs: file.write('/>\n') else: file.write('>\n') for x in subargs: print_xml_1(file, x, indent + 2) file.write(' ' * indent) file.write('\n' % xml_sub(xml[0])) # Pretty-print a section of XML, in the format above, to FILE. # Start at indent INDENT. def print_xml(file, xml): if xml_debug == 1: errout("Printing: %s\n" % str(xml)) print_xml_1(file, xml) # Return True if PROP is seen as a property in PROPLIST, a list of tuples # of (prop, value) def property_specified(prop, proplist): return not not ['foo' for (x,y) in proplist if x == prop] # Return value of property PROP in PROPLIST; signal an error if not found. def getprop(prop, proplist): for (x,y) in proplist: if x == prop: return y raise ValueError("Property %s not found in %s" % (prop, proplist)) # Return value of property PROP in PROPLIST, or DEFAULT. def getoptprop(prop, proplist, default=None): for (x,y) in proplist: if x == prop: return y return default # Replace value of property PROP with VALUE in PROPLIST. def putprop(prop, value, proplist): for i in xrange(len(proplist)): if proplist[i][0] == prop: proplist[i] = (prop, value) return else: proplist += [(prop, value)] # Replace property named PROP with NEW in PROPLIST. Often this is called with # with PROP equal to None; the None occurs when a PROP=VALUE clause is expected # but a bare value is supplied. The context will supply a particular default # property (e.g. 'name') to be used when the property name is omitted, but the # generic code to handle property-value clauses doesn't know what this is. # The surrounding code calls property_name_replace() to fill in the proper name. def property_name_replace(prop, new, proplist): for i in xrange(len(proplist)): if proplist[i][0] == prop: proplist[i] = (new, proplist[i][1]) ############################# # Error-handling # ############################# def init_errors(errors_to_string): # Count of number of errors seen so far. global error_count error_count = 0 global write_errors_to_string write_errors_to_string = errors_to_string global stdout_file, stderr_file if errors_to_string: stdout_file = cStringIO.StringIO() stderr_file = cStringIO.StringIO() else: stdout_file = sys.stdout stderr_file = sys.stderr global message_log message_log = [] def save_errors(cur): cur.error_count = error_count cur.write_errors_to_string = write_errors_to_string cur.stdout_file = stdout_file cur.stderr_file = stderr_file class InternalError(StandardError): pass def argformat(format, arg): if type(format) is str: return format % arg else: return str(format) # Throw an error, like fprintf(stderr, ...) def synerr(format, *arg): raise SyntaxError(argformat(format, arg)) # Output to stderr, maybe. But output to stdout if our input is being # output at the same time, so the two will stay in sync. 
def maybe_errout(str): # Force display of error # FIXME: Maybe we could dump all errors into a single # window display and show the messages together #showerror('Message', str) if options.transformed_input: stdout_file.write(str) else: stderr_file.write(str) def error_or_warning(title, lineno, format, *arg): formatted_arg = argformat(format, arg) if lineno: maybe_errout("%s, line %s: %s\n" % (title, lineno, formatted_arg)) else: maybe_errout("%s: %s\n" % (title, formatted_arg)) # Add the message as a tuple, for easy recall in the editor # Note: lineno being put in irrespective of the fact # of whether it exists or not # FIXME!! The purpose of errors_to_string and message_log duplicate # each other somewhat. Clean up. global message_log message_log += [(title, lineno, formatted_arg)] # Write formatted arguments to stderr, with Error: printed. def error(lineno, format, *arg): global error_count error_count += 1 error_or_warning('Error', lineno, format, *arg) # Write formatted arguments to stderr, with Warning: printed. def warning(lineno, format, *arg): global warning_count warning_count += 1 error_or_warning('Warning', lineno, format, *arg) # Write formatted arguments to stdout. def outout(format, *arg): stdout_file.write(argformat(format, arg)) # Write formatted arguments to stderr. def errout(format, *arg): stderr_file.write(argformat(format, arg)) # Debugging output: Always to sys.stderr. def debug(format, *arg): sys.stderr.write(argformat(format, arg)) def check_arg_type(errtype, arg, ty): if type(arg) is not ty: raise TypeError("%s: Type is not %s: %s" % (errtype, ty, arg)) ############################# # Abstract Syntax Trees # ############################# # Classes beginning with CS (= CCG Syntax) are used for constructing the # abstract syntax tree corresponding to a CCG source file. (An abstract # syntax tree, or AST, is a hierarchical representation of the syntax of a # piece of source code text, in this case a CCG-format file.) The source # file is made up out of blocks, each of which begins with an identifier # and is followed by one or more statements. # A CSNode corresponds to any unified section of source code -- a single # block or statement, a particular part of a statement (e.g. an # attribute-value list or a single attribute-value clause), or even the # whole file. The basic restriction is that it must correspond to a single # YACC production; hence it logically belongs in a unit and is the maximum # extent of text that belongs in the unit or possibly statement in a single # block. It has some corresponding source text with starting and ending # line numbers, a function to generate the XML, and a function to draw the # node. If the node is large enough to represent at least one XML # statement, it should be a list of XML statements in the XML-statement # form described above (a list [TAG, PROPLIST, CHILD ...]); otherwise, the # format is undefined, but most likely will be a property list. The CSNode # is initialized from the YaccProduction object (stored in variable `p', # usually, but accessed as $@) associated with a particular production, # which supplies the extent of source code associated with the production. class CSNode(object): def __init__(self, prod): self.prod = prod def xml(self): # In many cases, it's easiest just to build up the XML at creation time # and store it, rather than constructing it dynamically. Note that we # intentionally don't initialize self.static_xml, so we get an error # if it's not set. 
return self.static_xml # draw(self, parent, cfile, vars): Draw the node by returning a new widget # containing the drawn representation: Should be defined if node is # drawable. It should return a widget that is a child of PARENT, # also a widget. It is up to the caller to call pack() or grid() # so that the widget's geometry will be set; but the draw() function # should appropriately configure any child widgets that it creates. # VARS is an object containing Tkinter variables that may control the # way that the node is drawn. # A CSStatement corresponds to a single statement in a single block. Note # that, in the interests of simplicity, we don't currently create objects # for pieces of CCG code that are smaller than a statement; instead, we # just use the XML representation. We usually follow the convention that # if we have to make changes to the XML that make it not be in a one-to-one # correspondence with the original code, we do this at the level of the # statement or block. class CSStatement(CSNode): def __init__(self, prod): super(CSStatement, self).__init__(prod) # A CSBlock is a single block. class CSBlock(CSNode): def __init__(self, prod): super(CSBlock, self).__init__(prod) ############################# # Misc # ############################# # Is it identifier material? Input should be a character. def isalnumund(str): return str.isalnum() or str in '_+-' # Prior to Python 2.4, no sorted() def my_sorted(lyst): lystcopy = list(lyst) lystcopy.sort() return lystcopy ######################################################################## # Tokenizing # ######################################################################## # The following IDs have a special meaning to the OpenCCG tokenizer if a # token has the form [*ID*]. #magic_names = ('AMT', 'DATE', 'DUR', 'NUM', 'TIME') # It seems that the tokenizer does not require an [*ID*] token to be a known # magic thing (i.e. [*FOO*] is a legal surface form), so line 402 is commented # out. # If someone decides that [*ID*] tokens should be restricted to the ones # listed above, uncomment lines 397 and 503. # Directives -- These are particular words that are specially handled in # an appropriate position and hence need to be tokens for use in the # parser. However, they can also be part of a generic "word" -- in # other words, we have no "reserved words". directives = ( 'FAMILY', 'ENTRY', 'MEMBER', 'FEATURE', 'PROP', 'RULE', 'NO', 'APP', 'COMP', 'XCOMP', 'SUB', 'XSUB', 'TYPERAISE', 'TYPECHANGE', 'DEF', 'WORD', 'TESTBED', 'RELATION_SORTING' ) # Additional tokens that can form part of a word. A bare 'x' can form # part of a word as well, except for in a few circumstances. 
basic_word_no_x_tokens = ('ID', 'QUOTEDID') + directives word_no_x_tokens = ('NUMBER',) + basic_word_no_x_tokens word_no_number_tokens = ('X',) + basic_word_no_x_tokens word_tokens = ('NUMBER',) + word_no_number_tokens + ('MAGIC_ID',) bracket_tokens = ('LPAREN', 'RPAREN', 'LBRACKET', 'RBRACKET', 'LBRACE', 'RBRACE') other_tokens = ( # String tokens 'SLASH', 'BACKSLASH', 'LESS', 'GREATER', 'CARET', 'STAR', 'DOT', 'AT', 'EQUALS', 'GOESTO', 'PIPE', 'COMMA', 'SEMI', 'DOLLAR', 'COLON', 'BANG', 'TILDE', # Handled through t_ID 'PLUS', 'MINUS', 'PLUSMINUS', # Only in a def() 'NEWLINE', 'BOGUS_VALUE' # Kludge kludge kludge, fuck me harder ) tokens = word_tokens + bracket_tokens + other_tokens t_LPAREN = r'\(' t_RPAREN = r'\)' t_LBRACKET = r'\[' t_RBRACKET = r'\]' t_LBRACE = r'\{' t_RBRACE = r'\}' t_SLASH = r'/' t_BACKSLASH = r'\\' t_LESS = r'<' t_GREATER = r'>' t_CARET = r'\^' t_STAR = r'\*' t_DOT = r'\.' t_AT = r'@' t_EQUALS = r'=' t_GOESTO = r'=>' t_PIPE = r'\|' t_COMMA = r',' t_SEMI = r';' t_DOLLAR = r'\$' t_COLON = r':' t_BANG = r'!' t_TILDE = r'~' # Identifiers and directives directives_map = { } for r in directives: directives_map[r.lower().replace('_', '-')] = r directives_map['x'] = 'X'; # We handle +, -, and +- here because + and - can, in general, form part # of a token. directives_map['+'] = 'PLUS'; directives_map['-'] = 'MINUS'; directives_map['+-'] = 'PLUSMINUS'; def t_ID(t): r'''(([\-+%a-zA-Z_0-9]|[^\000-\177])+|"[^"\n]+"|\'[^'\n]+')''' # convert to directive, maybe if re.match(r'^\d+$', t.value): t.type = 'NUMBER' try: t.value = int(t.value) except ValueError: error(t.lineno, "Integer value too large: %s", t.value) t.value = 0 elif t.value in directives_map: t.type = directives_map[t.value] else: t.type = 'ID' # remove quotes if they're there if t.value[0] == '"' or t.value[0] == "'": t.type = 'QUOTEDID' t.value = t.value[1:-1] return t # The distinction from ordinary IDs is currently not really needed, i.e. t_ID # could to the job, too. However, it leaves open the possibility to handle # magic IDs differently from ordinary ones. def t_MAGIC_ID(t): r'''(\[\*[^*]+\*\])''' t.type = 'MAGIC_ID' return t #t_MAGIC_WORD.func_doc = '(\[\*(' + '|'.join(magic_names) + ')\*\])' t_ignore = " \t\r" #bracketmap = {'(': 'LPAREN', ')': 'RPAREN', # '[': 'LBRACKET', ']': 'RBRACKET', # '{': 'LBRACE', '}': 'RBRACE'} # #def t_LBRACKET(t): # r'[\[\(\{]' # global parendepth # parendepth += 1 # t.type = bracketmap[t.value] # return t # #def t_RBRACKET(t): # r'[\]\)\}]' # global parendepth # parendepth -= 1 # t.type = bracketmap[t.value] # return t def t_backslash_newline(t): r'\\\r?\n' t.lineno += 1 # If it's not a line continuation, it's just a normal backslash if not lexer_track_newlines: t.type = 'BACKSLASH' return t def t_newline(t): r'\n' t.lineno += 1 if lexer_track_newlines: t.type = 'NEWLINE' return t # Comments def t_comment(t): r'\#[^\n]*\n' t.lineno += 1 def t_error(t): error(t.lineno, "Illegal character '%s'", t.value[0]) t.skip(1) def init_lexer(): # This is a signal to us to go into "line mode", where we return a # newline as a token and treat backslash at the end of a line as a line # continuation device. global lexer_track_newlines lexer_track_newlines = 0 # Build the lexer. This does introspection, on all the t_*() functions. 
global globallexer globallexer = lex.lex(debug=lex_debug) def save_lexer(cur): cur.lexer_track_newlines = lexer_track_newlines cur.globallexer = globallexer ######################################################################## # Parsing # ######################################################################## def p_word(p): 'FILLED IN BELOW' p[0] = p[1] # fill in the documentation (i.e. the cfg rule) p_word.func_doc = 'word : ' + '\n| '.join(word_tokens) # hack, to deal with a reduce/reduce conflict def p_word_except_x(p): 'FILLED IN BELOW' p[0] = p[1] # fill in the documentation (i.e. the cfg rule) p_word_except_x.func_doc = 'word_except_x : ' + '\n| '.join(word_no_x_tokens) def p_word_no_numbers(p): 'FILLED IN BELOW' p[0] = p[1] # fill in the documentation (i.e. the cfg rule) p_word_no_numbers.func_doc = ( 'word_no_numbers : ' + '\n| '.join(word_no_number_tokens)) %y ############################# # Begin Yacc Declarations # ############################# ############################# # Word lists, etc # ############################# empty: : $$ = [] commas: COMMA : commas COMMA typed_word : word : word COLON word : $$ = '%s:%s' % ($1, $3) # Possibly empty list of words word_0: word : word commas word_list: word_0 * # Possibly empty list of words or * word_or_star: word | STAR word_or_star_0: word_or_star : word_or_star commas # Non-empty list of words #nonempty_word_list: word_0 : $$ = [$1] # : nonempty_word_list word_0 : $$ = $1 + [$2] # Attribute lists contain specifications of the form ATTR=VALUE. The # return value is a list of (attribute, value) tupes. attr : word EQUALS word : $$ = ($1, $3) attr_0: attr : attr commas attr_list: attr_0* opt_paren_attr_list: empty : LPAREN attr_list RPAREN : $$ = $2 # Extended attribute lists contain either VALUE or ATTR=VALUE. The return # value is a list of (attribute, value) tupes; when a bare value is given, # the attribute is None. ext_attr : word : $$ = (None, $1) : word EQUALS word : $$ = ($1, $3) ext_attr_0: ext_attr : ext_attr commas ext_attr_list: ext_attr_0* opt_paren_ext_attr_list: empty : LPAREN ext_attr_list RPAREN : $$ = $2 ############################# # Statements # ############################# top : statement* statement : family_block | feature_block | rule_block | macro_def | word_block | testbed_block | relation_sorting_block : SEMI ############################# # Macros # ############################# %p def init_macros(): # Used to turn off macro substitution while processing a macro definition. global no_macro_sub no_macro_sub = 0 # Needed to handle issue where macro def is immediately followed by # macro call. global return_bogus_value return_bogus_value = 0 # Mapping of macro definitions to parameter list and text. global macro_defs macro_defs = {} # It doesn't really matter what the parameter names are for built-ins. # There just have to be the right number of them. 
macro_defs['regsub'] = MacroDef(['fromre', 'totext', 'str'], regsub) macro_defs['ifmatch'] = MacroDef(['regex', 'string', 'doif', 'doelse'], ifmatch) macro_defs['ifmatch-nocase'] = MacroDef(['regex', 'string', 'doif', 'doelse'], ifmatch_nocase) def save_macros(cur): cur.no_macro_sub = no_macro_sub cur.return_bogus_value = return_bogus_value cur.macro_defs = macro_defs class MacroDef: def __init__(self, args, text): self.args = args self.text = text class CCGToken(lex.LexToken): def __init__(self, type, value): self.type = type self.value = value def arg_to_text(arg): return ''.join([str(x.value) for x in arg]) # Implementation of built-in 'regsub()': Concatenate the tokens into # text, then do regex substitution. def regsub(fromre, totext, string): return re.sub(arg_to_text(fromre), arg_to_text(totext), arg_to_text(string)) # If REGEX matches the beginning of STRING, return DOIF, else return DOELSE. def ifmatch(regex, string, doif, doelse): if re.match(arg_to_text(regex), arg_to_text(string)): return doif else: return doelse # Same as ifmatch() but case-insensitive. def ifmatch_nocase(regex, string, doif, doelse): if re.match(arg_to_text(regex), arg_to_text(string), re.IGNORECASE): return doif else: return doelse def print_macros(): for (key, value) in macro_defs.iteritems(): print "Macro: %s(%s): %s" % (key, value.args, value.text) # Given some text, expand the macros in it, recursively (i.e. apply # any macros, then apply macros to the resulting text, etc.). After # that, combine text that has the . operator applied to it. def macroexpand_text(text): if super_macro_debug: print "Text before expanding: %s" % arg_to_text(text) # Now recursively expand macros. The code to actually check for # macros is in MacroLexer. lexer = MacroLexer(None) lexer.pushstack(text) newtext = [] while True: tok = lexer.token() #print "Reading token: %s" % tok if not tok: break newtext.append(tok) text = newtext l = len(text) if super_macro_debug: print "Text after expanding: %s" % arg_to_text(text) # Now directly handle instances with the '.' operator, so that # the operator can be used to create new macro calls x = 1 while x < l - 1: if (text[x].type == 'DOT' and text[x-1].type in ['ID', 'QUOTEDID'] and text[x+1].type in ['ID', 'QUOTEDID']): tok = CCGToken(text[x-1].type, text[x-1].value + text[x+1].value) tok.lineno = text[x].lineno # If either is quoted, the result should be quoted. if text[x+1].type == 'QUOTEDID': tok.type = 'QUOTEDID' text[x-1] = tok text[x:x+2] = [] x -= 2 l -= 2 x += 1 return text # Return text of macro, with ARGS substituted for formal parameters of # the macro. def macrosub(macdef, args, lineno): text = macdef.text # If the text definition is a function (for builtins), # macro-expand the arguments, then call the function. if callable(text): args = [macroexpand_text(x) for x in args] text = text(*args) if type(text) is str: text = [CCGToken('QUOTEDID', text)] text[0].lineno = lineno return text else: return macroexpand_text(text) else: # Otherwise, make a copy of the text and substitute the arguments # into it. text = text[:] args = dict(zip(macdef.args, args)) l = len(text) x = 0 while x < l: if (text[x].type == 'ID' or text[x].type in directives) \ and text[x].value in args: newtext = args[text[x].value] text[x:x+1] = newtext l += len(newtext) - 1 x += len(newtext) - 1 x += 1 return macroexpand_text(text) %y # We need to do some hackery with BOGUS_VALUE in order to avoid problems # when a macro definition is immediately followed by a call to that same # macro. 
The problem is that generally the parser wants to read one token # ahead. As a result, by the time it's processed the token that ends a # macro definition, it's already read the following token -- and if that # token begins a macro call, we're screwed. To avoid this, we ensure that # there is an extra BOGUS_VALUE token returned after every macro definition. # To make this happen, we set a flag return_bogus_value just before the # parser processes the token ending the macro definition. At this point, # the parser has already read that token from the lexer, and before it # reduces that token, it reads the next token from the lexer -- which # returns a bogus token, as we instructed it. macro_def : macro_def_1 BOGUS_VALUE turn_off_macro_sub: : global no_macro_sub no_macro_sub = 1 return_bogus_value: : global return_bogus_value return_bogus_value = 1 global no_macro_sub no_macro_sub = 0 macro_def_1 : turn_off_macro_sub DEF word LPAREN macro_param_list turn_on_linetrack RPAREN macro_text : macdef = MacroDef($5, $8) macdef.args = $5 macdef.text = $8 if $3 in macro_defs: error($@.lineno(0), "Redefining macro %s" % $3) macro_defs[$3] = macdef #print_macros() macro_param_list : word_list macro_text: bracemacro_text | linemacro_text bracemacro_text: turn_off_linetrack LBRACE bracemacro_text_list return_bogus_value RBRACE: $$ = $3 bracemacro_text_list: empty : $$ = [] : bracemacro_text_list bracemacro_text_entry : $$ = $1 + $2 # The key thing about these is that they must be invoked BEFORE the # token that tells you whether to turn the mode on or off. If you # try to set the global variable after (even directly after) the # RPAREN or NEWLINE or whatever has been processed by a rule, it's too # late: The parser has already looked ahead, and any newline directly # following the token in question already processed the wrong way. turn_on_linetrack: : global lexer_track_newlines lexer_track_newlines = 1 turn_off_linetrack: : global lexer_track_newlines lexer_track_newlines = 0 %p def p_bracemacro_text_entry(p): '''bracemacro_text_entry : LPAREN bracemacro_text_list RPAREN | LBRACKET bracemacro_text_list RBRACKET | LBRACE bracemacro_text_list RBRACE''' p[0] = [p.slice[1]] + p[2] + [p.slice[3]] def p_bracemacro_text_entry_other(p): 'FILLED IN BELOW' p[0] = [p.slice[1]] # fill in the documentation (i.e. the cfg rule) p_bracemacro_text_entry_other.func_doc = ( 'bracemacro_text_entry : ' + '\n| '.join(other_tokens + word_tokens) ) %y linemacro_text: turn_off_linetrack return_bogus_value NEWLINE: $$ = [] linemacro_text: linemacro_begin linemacro_next* turn_off_linetrack return_bogus_value NEWLINE: $$ = [$1] + $2 %p def p_linemacro_begin(p): p[0] = p.slice[1] def p_linemacro_next(p): p[0] = p.slice[1] linemacro_begin_tokens = [x for x in tokens if x != 'NEWLINE' and x != 'LBRACE'] linemacro_next_tokens = [x for x in tokens if x != 'NEWLINE'] # fill in the documentation (i.e. the cfg rule) p_linemacro_begin.func_doc = ( 'linemacro_begin : ' + '\n| '.join(linemacro_begin_tokens) ) p_linemacro_next.func_doc = ( 'linemacro_next : ' + '\n| '.join(linemacro_next_tokens) ) %y ############################# # Feature blocks # ############################# %p def init_features(): # For each feature value, map its name to a CCGFeatval structure # describing it. global feature_values feature_values = {} # List of values for a particular feature; each value is a CCGFeatval, # listing a value, its parents, licensing info, macro info, and its # feature. 
global feature_to_values feature_to_values = {} # List of distributive features global distributive_features distributive_features = [] # List of XML for licensing features global licensing_feature_xml licensing_feature_xml = [] # Mapping of the names of feature values to the value inserted into the # XML 'val' attribute; usually the same as the name. (YUCK YUCK YUCK) global fv_names_to_values fv_names_to_values = {} def save_features(cur): cur.feature_values = feature_values cur.feature_to_values = feature_to_values cur.distributive_features = distributive_features cur.licensing_feature_xml = licensing_feature_xml cur.fv_names_to_values = fv_names_to_values # A feature value: The "name" of the feature value (corresponding to a # feature macro), the parents of this value, and any licensing info. Also # may include a .feature, which is the "feature" that this value is a value # for. class CCGFeatval: def __init__(self, name, parents, licensing): self.name = name self.parents = parents self.licensing = licensing def __str__(self): return "CCGFeatval(%s, parents=%s, licensing=%s)" % ( (self.name, self.parents, self.licensing)) def __repr__(self): return str(self) # Encapsulates directly obtained values and values obtained recursively, # so we can avoid needlessly adding parents to the latter kind. # Used temporarily when building the hierarchy. Both direct and recursive # are lists of CCGFeatvals. class CCGFeatvalList: def __init__(self, direct, recursive=None): recursive = recursive or [] # fuckme! self.direct = direct self.recursive = recursive def __str__(self): return "CCGFeatvalList(direct=%s,recursive=%s)" % (self.direct,self.recursive) def __repr__(self): return str(self) # For the given feature, and list of CCGFeatvals, convert the parents in # each CCGFeatval to a list of CCGFeatvals rather just strings, and clean # any excess parents. Basically, if a value has multiple parents and one # is reachable by following a path starting from another, it needs to be # removed. # FIXME!! Also output warnings when a featvar and featval have the same name. def install_feature(feature, lis, lineno): # Add names to reverse-feature list and check for duplicates. for x in lis: if x.name in feature_values: warning(lineno, "Duplicate feature value `%s' (feature `%s', previously in feature `%s')", x.name, feature, feature_values[x.name].feature) else: feature_values[x.name] = x x.feature = feature # Change the parents list of each value to point to actual featval objects # rather than just strings; check for unrecognized and duplicate values. for x in lis: newpar = [] for y in x.parents: if y in feature_values: if feature_values[y] in newpar: synerr("Duplicate feature value %s as parent of %s, feature %s", y, x.name, feature) else: newpar.append(feature_values[y]) else: synerr("Unrecognized feature value %s as parent of %s, feature %s", y, x.name, feature) x.parents = newpar # Check NODE and its parents to make sure it hasn't been seen before in # LIST, adding NODE to LIST as soon as it's seen. def check_cycles(node, list): if node in list: synerr("Cycle seen involving feature value %s", node.name) for x in node.parents: check_cycles(x, list + [node]) # Check for cycles. for x in lis: check_cycles(x, []) # Check NODE and its parents to make sure that ORIGNODE is not reachable. def check_reachable(node, orignode): if node == orignode: return True for x in node.parents: if check_reachable(x, orignode): return True return False # Clean excess parents. 
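# Worked illustration of this pruning step, as a self-contained sketch over
# plain strings instead of CCGFeatval objects (the value names are made up):
# suppose nom and acc each have parent case, and some value lists direct
# parents [nom, acc, case].  Then case is redundant, because it is already
# reachable from nom (and acc), and only nom and acc should be kept.

def _prune_redundant_parents_sketch(parents, parent_map):
    # parents: list of names; parent_map: name -> list of parent names
    def reachable(frm, target):
        if frm == target:
            return True
        return any(reachable(p, target) for p in parent_map.get(frm, []))
    kept = []
    for y in parents:
        # drop y if some *other* direct parent already reaches it
        if not any(z != y and reachable(z, y) for z in parents):
            kept.append(y)
    return kept

# _prune_redundant_parents_sketch(['nom', 'acc', 'case'],
#                                 {'nom': ['case'], 'acc': ['case']})
# => ['nom', 'acc']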
for x in lis: newpar = [] for y in x.parents: for z in x.parents: if z != y and check_reachable(z, y): break else: newpar.append(y) x.parents = newpar # Finally: Add to feature list. feature_to_values[feature] = lis # Return XML to go in types.xml. def make_feature_types_xml(): xml = [] for (x, featvals) in feature_to_values.iteritems(): # FIXME! Figure out what's going wrong here. # typename = x # print "fv_names_to_values: %s" % fv_names_to_values # if x in fv_names_to_values: # typename = fv_names_to_values[x] # xml += [['type', [('name', typename)]]] xml += [['type', [('name', x)]]] for y in featvals: if y.parents: xml += [['type', [('name', y.name), ('parents', ' '.join([z.name for z in y.parents]))]]] else: xml += [['type', [('name', y.name), ('parents', x)]]] return xml # Return XML to go in morph.xml. def make_feature_morph_xml(): xml = [] for x in my_sorted(feature_values): featval = feature_values[x] if featval.macrotie: entry = ['macro', [('name', '@%s' % x)]] for y in featval.macrotie: if type(y) is int: entry += [['fs', [('id', y)], ['feat', [('attr', featval.feature), ('val', fv_names_to_values[x])]]]] else: (wordtie, typename) = y entry += [['lf', [], ['satop', [('nomvar', wordtie)], ['diamond', [('mode', typename)], ['prop', [('name', fv_names_to_values[x])]]]]]] xml += [entry] return xml # Return XML to go in lexicon.xml. def make_feature_lexicon_xml(): xml = [] if distributive_features: xml.append(['distributive-features', [('attrs', ' '.join(distributive_features))]]) if licensing_feature_xml: xml.append(['licensing-features', []] + licensing_feature_xml) return xml %y # Allow you to override the value inserted by a feature macro, if you # really want to (requested by Fred). featval_2: word: $$ = ($1, $1) : word COLON word: $$ = ($1, $3) featval_1: featval_2 : $$ = $1 + ([], []) : featval_2 LBRACKET word_list RBRACKET : $$ = $1 + ($3, []) : featval_2 LPAREN attr_list RPAREN : $$ = $1 + ([], $3) : featval_2 LBRACKET word_list RBRACKET LPAREN attr_list RPAREN : $$ = $1 + ($3, $6) featval: featval_1: (name, value, parents, licensing) = $1 fv_names_to_values[name] = value $$ = CCGFeatval(name, parents, licensing) set_featval: featval: $$ = CCGFeatvalList([$1]) : featval LBRACE set_featval_list RBRACE: # The set_featval_list returns a CCGFeatvalList, where the direct entries # are those actually in the list itself, and the recursive entries # are descendants of them. First add ourself as parent to the direct # entries. Then move direct into recursive and put ourself as the only # direct entry. for x in $3.direct: x.parents += [$1.name] $$ = CCGFeatvalList([$1], $3.direct + $3.recursive) set_featval_0: set_featval : set_featval commas set_featval_list: set_featval_0 : set_featval_list set_featval_0: $1.direct += $2.direct; $1.recursive += $2.recursive; $$ = $1 featvar: NUMBER: $$ = int($1) : word_no_numbers: $$ = ($1, $1) : word_no_numbers COLON word: $$ = ($1, $3) featvar_0 : featvar : featvar commas opt_featspec: empty : $$ = (None, None) : LESS featvar_0+ GREATER : $$ = ($2, None) : LPAREN attr_list RPAREN : $$ = (None, $2) : LESS featvar_0+ GREATER LPAREN attr_list RPAREN: $$ = ($2, $5) opt_feature_bang: empty | BANG # We declare this in a slightly strange way to work around the awful bug # involving non-recognition of empty RHS rules. 
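# Hypothetical feature declaration and (roughly) the XML derived from it by the
# helpers above; the feature and value names are made up:
#
#   feature {
#     CASE<2>: case {nom acc};
#   }
#
# make_feature_types_xml() then emits, into types.xml:
#   <type name="CASE"/>
#   <type name="case" parents="CASE"/>
#   <type name="nom"  parents="case"/>
#   <type name="acc"  parents="case"/>
# and make_feature_morph_xml() emits macros such as
#   <macro name="@nom"><fs id="2"><feat attr="CASE" val="nom"/></fs></macro>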
feature_decl_tail: SEMI: $$ = [] : COLON set_featval_list SEMI: $$ = $2 feature_decl : opt_feature_bang word opt_featspec feature_decl_tail: if $1: global distributive_features distributive_features.append($2) if $4: feature_values = $4.direct + $4.recursive else: feature_values = [] install_feature($2, feature_values, $@.lineno(0)) (macrotie, licensing) = $3 # Add macro-tie info to each feature for x in feature_values: x.macrotie = macrotie # Handle licensing attributes on the feature values global licensing_feature_xml for x in feature_values: if x.licensing: licensing_feature_xml.append( ['feat', [('attr', $2), ('val', fv_names_to_values[x.name])] + x.licensing]) # Handle licensing attributes on the feature itself rather than # on a feature value if licensing: licensing_feature_xml.append(['feat', [('attr', $2)] + licensing]) feature_block : FEATURE LBRACE feature_decl* RBRACE ############################# # Atomic categories # ############################# unification_id: NUMBER: $$ = ('id', $1) : TILDE NUMBER: $$ = ('inheritsFrom', $2) unification_id_0: unification_id : unification_id commas unification_id_spec: LESS unification_id_0* GREATER: $$ = $2 atomcat_bracket_entry : word EQUALS word : $$ = ['feat', [('attr', $1), ('val', $3)]] atomcat_bracket_entry : word EQUALS STAR : $$ = ['feat', [('attr', $1), ('val', '[*DEFAULT*]')]] # FIXME!!!! Be more intelligent in determining how to separate nomvars # and featvars, instead of just using some isupper() hacks. We should # check to see if the nomvars are represented in the corresponding # hylo spec. We should also output warnings if a bare word occurs and # it is not identified anywhere as either a nomvar (should appear in hylo), # a featvar (should appear in feature {}), or a featval (likewise). atomcat_bracket_entry : word : if $1[0].isupper() and (len($1) == 1 or not $1[1].isupper()): $$ = ['feat', [('attr', 'index')], ['lf', [], ['nomvar', [('name', $1)]]]] elif $1 in feature_values: $$ = ['feat', [('attr', feature_values[$1].feature), ('val', $1)]] else: $$ = ['feat', [('attr', $1)], ['featvar', [('name', "%s" % $1.upper())]]] atomcat_bracket_entry : word COLON word: $$ = ['feat', [('attr', $1)], ['featvar', [('name', "%s:%s" % ($1.upper(), $3))]]] atomcat_bracket_entry_0: atomcat_bracket_entry : atomcat_bracket_entry commas atomcat_bracket : LBRACKET atomcat_bracket_entry_0* RBRACKET : $$ = $2 # The use of word_except_x here is a hack to avoid a reduce/reduce conflict # due to the use of x as an operator as well as a word. Without it, the # parser doesn't know, e.g., how to disambiguate something beginning # FOO/x(... -- is x an operator or a category? The parser only looks one # character ahead, so it can't figure this out. With this hack, you cannot # use a single lowercase x as a category name without putting it in quotes, # e.g. 'x'. atomcat : word_except_x unification_id_spec? atomcat_bracket? 
: $$ = ['atomcat', [('type', $1)], ['fs', $2] + $3] ############################# # Slashes # ############################# %p # Temporary switch to Python mode to insert the needed function slash_to_default_mode = {'/':'>', '\\':'<', '|':'.'} ability_to_ability_value = {'@': 'active', '!': 'inert', None:None} ability_value_to_ability = {'active': '@', 'inert': '!', None:None} def makeslash(direc, mode, ability): if not mode: mode = slash_to_default_mode[direc] if direc == '|': direc = None ability = ability_to_ability_value[ability] return ['slash'] + [(direc and [('dir', direc)] or []) + (ability and [('ability', ability)] or []) + (mode and [('mode', mode)] or [])] %y bareslash : SLASH | BACKSLASH | PIPE slash_ability : AT | BANG slash_mode : X GREATER : $$ = 'x>' : LESS X : $$ = '[E] \ np<2>[X nom] / np<3>[Y acc] # # # XML output: # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # ###################### # This is a basic attempt to create a compact (BNF-style) syntax for # representing legal XML for categories. The idea is that this could be # parsed and used to verify the XML, or perhaps to convert it to some other # form. It's not clear this is worth it -- there is already an XML schema # notation for describing legal XML (albeit it's extremely obnoxious and # verbose), and verifiers for verifying XML given a schema and a piece of # XML, and XSLT (again, obnoxiously verbose) for transforming XML. # category = ( atomcat | complexcat ) # complexcat { # atomcat # (slash (category | dollar) | dollar | setarg)+ # lf? # } # basicArg = ( slash | category ) # dollarArg = ( slash | dollar ) # dollar(name) # setarg { basicArg basicArg+ } # atomcat(!type=[NMTOKEN]) { # fs? # lf? # } # fs(id) { # (feat(attr='index') { # lf { nomvar(name) } } # | feat(attr, val) # )+ # } # slash(dir=('/', '\\', '|'), mode=('.', '*', '^', 'x', 'x<', ''), # varmodality, ability=('inert', 'active')) # fs(id): # ... %p ################## # Initialization # ################## # This maps face names to actual properties. A face is the complete # description for how a particular piece of text is to be displayed. The # properties can specify the font family, size, bold or not, italic or not, # subscript or not, "scale" (modify the size by the specified value), and # "inherit" to inherit from a specified face. If not otherwise given, # all faces inherit from the default. face_mapping_init = { # The default mapping should contain a value for all parameters 'default':{'family':'times', 'size':16, 'bold':False, 'italic':False, 'subscript':False, 'superscript':False, 'scale':100, 'foreground':None, 'background':None}, 'subscript':{'family':'helvetica', 'subscript':True, 'scale':70, }, 'category':{'bold':True, 'family':'helvetica'}, 'dollar':{}, 'slash':{}, 'slash mode':{'subscript':True, 'scale':65}, 'paren':{}, 'brace':{}, 'family name':{'foreground':'blue', 'scale':130, 'bold':True}, 'lexical item':{'italic':True}, 'numeric index':{'inherit':'subscript'}, 'subscript comma':{'inherit':'subscript'}, 'nomvar':{'inherit':'subscript', 'foreground':'forest green'}, 'feature':{'inherit':'subscript', 'bold':True, 'foreground':'red'}, # Ideally the following should be in small caps 'caret':{'scale':115}, 'semname':{'scale':115}, 'semrole':{'scale':85, 'bold':True}, 'member heading':{}, 'member comma':{}, 'member':{'bold':True}, } # Offset to be applied to the baseline to handle subscripts and superscripts, # relative to the size of the font of the subscripted/superscripted text. 
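# Worked example of the face tables above (following face_mapping_init and the
# fixup/merge helpers defined below): the 'nomvar' face inherits from
# 'subscript', which inherits from 'default', so after merging it carries
#   family='helvetica', subscript=True, scale=70, foreground='forest green'
# plus the remaining defaults; fixup_face_properties() then folds scale into
# size, size = int(16 * 70 / 100.0 + 0.5) = 11, and builds the Tk font from
# the family/size/bold/italic values.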
# FIXME: Maybe should be relative to the larger size of the base (non-offset) # text. This would require that the 'scale' option not be handled in # fixup_face_properties() but dealt with at the time that the offset is # computed, so that the original text size is still available. subscript_offset = -0.5 superscript_offset = 1 # Factor to scale all: FIXME, not currently working zoom_factor = 100 # Merged and fixed up equivalent of the above. This will also have a # 'font' property containing the Tk font item corresponding to the # family, size, bold, and italic properties. face_mapping = {} # Fix up a derived table of properties. Currently this only handles 'scale'. # This destructively modifies the property table. def fixup_face_properties(props): if 'scale' in props: scale=props['scale'] del props['scale'] assert 'size' in props # Consider the size to its scaling factor props['size'] = int(props['size'] * scale / 100.0 + 0.5) family = props['family'] size = props['size'] weight = props['bold'] and 'bold' or 'normal' slant = props['italic'] and 'italic' or 'roman' props['font'] = tkFont.Font(family=family, size=size, weight=weight, slant=slant) return props # Merge two tables of properties, with P2 overriding P1. Remove the # 'inherit' property in the process. Creates a new table, and does not # modify P1 or P2. def merge_face_properties(p1, p2): props = {} for x in p1: if x != 'inherit': props[x] = p1[x] for x in p2: if x != 'inherit': props[x] = p2[x] return props # Derive the complete list of properties associated with a face name. def face_properties(name): props = face_mapping_init[name] # If name is default, return properties directly if name == 'default': return merge_face_properties(props, {}) # Else, determine where to inherit from and merge properties with # recursively computed value if 'inherit' in props: inherit = props['inherit'] else: inherit = 'default' return merge_face_properties(face_properties(inherit), props) # Compute the merged properties for all faces. def compute_face_properties(): for x in face_mapping_init: props = fixup_face_properties(face_properties(x)) face_mapping[x] = props def late_init_draw_once(): compute_face_properties() ################################# # Drawing a section of text # ################################# # Create tags in a text widget corresponding to the faces and their # properties. FIXME: Maybe we should do this only when needed, for each # text widget. def create_tags(text): for x in face_mapping: props = face_mapping[x] offs = 0 if props['subscript']: offs = subscript_offset elif props['superscript']: offs = superscript_offset offs = offs*props['size'] offs = '%sp' % offs # Dimension in points text.tag_config(x, font=props['font'], offset=offs) fg = props['foreground'] bg = props['background'] if fg: text.tag_config(x, foreground=fg) if bg: text.tag_config(x, background=bg) # A "draw-into" object, used for incrementally building up some text # in various fonts. Initialized with a parent widget and some initial text. # Drawing into it is done by calls to text(). When done, call finish() # to return a widget containing the text (which can then be packed, gridded, # etc.). 
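# A minimal usage sketch (hypothetical; assumes a Tk root window exists and the
# face tags have been computed via late_init_graphics()):
#
#   d = draw_into(some_frame, width=40)
#   d.text('np', 'category')
#   d.text('3', 'numeric index')    # rendered as a subscript-style index
#   w = d.finish()                  # returns a read-only Text widget
#   w.pack(side=LEFT)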
class draw_into(object): def __init__(self, master, width=120): self.wid = Text(master, height=3, width=width, borderwidth=0, relief=FLAT, background='white') self.curface = None self.wid.slash_image = [] self.curtext = '' create_tags(self.wid) # Self.alltext maintains the length of the text printed # for the current widget self.alltext = 0 # FIXME: the tirgger for bigger height of the Text # widget is arbitrarily set to 95. This should be # driven by width of individual fonts and chars self.expandTrigger = 95 def finish_run(self): if self.curtext: self.wid.insert(INSERT, self.curtext, (self.curface,)) #props = face_mapping[self.curface] #Label(self.wid, text=self.curtext, # font=props['font']).pack(side=LEFT) self.curtext = '' def text(self, tex, face='default'): if self.curface == face: self.curtext += tex else: self.finish_run() self.curtext = tex self.curface = face # Increase recorded length of text self.alltext += len(tex) # Increase height if necessary if (self.alltext > self.expandTrigger): heightval = 3* (self.alltext/self.expandTrigger +1) self.wid.config(height= heightval) def finish(self): self.finish_run() self.wid.config(state=DISABLED) return self.wid def image(self, img): # When there is an image to be embedded self.finish_run() # Access the OPENCCG_HOME environment variable # to determine the correct path for the images openccg_home = os.environ['OPENCCG_HOME'] gifdir = openccg_home+"/images/slashes/" image = PhotoImage(file=gifdir+img) # We are creating an instantiated variable here # for the image, because the actual photo object is destroyed once # the execution leaves the __init__ code. Without building it this way, # the display was showing only a space for the image but not the image itself self.wid.slash_image += [image] self.wid.image_create(INSERT, image=image) def onHilite(self): self.wid.config(bg = '#E9FFE3') def offHilite(self): self.wid.config(bg = 'white') def category_draw_children(into, chils, depth, vars, need_initial_comma=False, sep='', sepface='default'): for x in chils: if sep and need_initial_comma: into.text(sep, sepface) need_initial_comma = True category_draw(into, x, depth=depth + 1, vars=vars) # Given the XML for a category, draw a graphical representation into the # widget INTO. 
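# The XML argument uses the nested-list convention found throughout this file,
# ['tag', [(attr, value), ...], child, child, ...].  For instance, a
# hypothetical category np<2>[num=sg] arrives here roughly as
#
#   ['atomcat', [('type', 'np')],
#     ['fs', [('id', 2)],
#       ['feat', [('attr', 'num'), ('val', 'sg')]]]]
#
# and category_draw() walks that structure, calling into.text()/into.image()
# for each piece.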
The drawing is done by calling into.text(TEXT, FACE) def category_draw(into, xml, depth, vars): ty = xml[0] props = xml[1] chils = xml[2:] if ty == 'complexcat': if depth > 0: into.text('(', 'paren') category_draw_children(into, chils, depth, vars) if depth > 0: into.text(')', 'paren') elif ty == 'atomcat': into.text(getprop('type', props), 'category') category_draw_children(into, chils, depth, vars) elif ty == 'setarg': into.text('{', 'brace') category_draw_children(into, chils, depth, vars) into.text('}', 'brace') elif ty == 'fs': needcomma = False if vars.show_feat_id.get(): idval = getoptprop('id', props) if idval: #into.text('<%s>' % idval, 'numeric index') into.text('%s' % idval, 'numeric index') needcomma = True if vars.show_feat_struct.get(): category_draw_children(into, chils, depth, vars, need_initial_comma=needcomma, sep=',', sepface='subscript comma') elif ty == 'feat': attr = getprop('attr', props) if attr == 'index': assert len(chils) == 1 assert chils[0][0] == 'lf' chils = chils[0][2:] assert len(chils) == 1 assert chils[0][0] == 'nomvar' into.text(getprop('name', chils[0][1]), 'nomvar') else: val = getoptprop('val', props, None) if val: if vars.show_full_features.get(): into.text("%s=%s" % (attr, getprop('val', props)), 'feature') else: into.text("%s" % getprop('val', props), 'feature') else: into.text("%s" % attr, 'feature') elif ty == 'slash': dir = getoptprop('dir', props, '|') mode = getoptprop('mode', props) ability = getoptprop('ability', props) # into.text('%s' % dir, 'slash') # into.text('%s%s' % (mode or '', # ability_to_ability_value[ability] or ''), # 'slash mode') # We create the file name here # By interpreting various parameters # and joiing them together as a string if dir == '\\': slash_string = 'bk' elif dir == '/': slash_string = 'fd' else: slash_string = 'str' #slash_mode : X GREATER : $$ = 'x>' # : LESS X : $$ = '':'cross_greater', '':'greater', '<':'lesser', 'x':'cross', '.':'dot', '*':'star', '^':'box'} if mode == None: image_string = slash_string + '.GIF' else: image_string = slash_string+ '_' + modelist[mode] + '.GIF' into.image(image_string) elif ty == 'dollar': name = getoptprop('name', props) into.text('$', 'dollar') into.text('%s' % name, 'numeric index') else: # Have commented the following assert Statement # and the debug statement # Because of validation errors #debug('ty??? 
%s\n' % ty) #assert False dummy = 1 %y complexcat_entry : atomcat : LPAREN complexcat RPAREN : $$ = $2 complexcat_postmod : DOLLAR NUMBER : $$ = [['slash', []], ['dollar', [('name', $2)]]] complexcat_postmod : slash complexcat_entry : $$ = [$1, $2] #complexcat_postmod : slash DOLLAR NUMBER : # $$ = [$1, ['dollar', [('name', $3)]]] complexcat : complexcat_entry : complexcat complexcat_postmod : if $1[0] != 'complexcat': $1 = ['complexcat', []] + [$1] $$ = $1 + $2 cat_set_entry : slash complexcat_entry : $$ = [$1, $2] cat_set_entry_0: cat_set_entry : cat_set_entry commas complexcat : complexcat LBRACE cat_set_entry_0+ RBRACE : # $3 comes as a list of lists of the form [slash, cat]; we need to # flatten the list, which is what reduce() does if $1[0] != 'complexcat': $1 = ['complexcat', []] + [$1] $$ = $1 + [['setarg', []] + reduce(lambda x,y:x+y, $3)] ############################# # Hybrid logic # ############################# # Example: # # Source: # # E:action(* X:animate-being Y:sem-obj) # # XML output: # # # # # # # # # # # # %p def hylo_draw_children(into, chils, need_initial_comma=False, sep='', sepface='caret'): for x in chils: if sep and need_initial_comma: into.text(sep, sepface) need_initial_comma = True hylo_draw(into, x) # Given the XML for a hylo, draw a graphical representation into the # widget INTO. The drawing is done by calling into.text(TEXT, FACE) def hylo_draw(into, xml): ty = xml[0] props = xml[1] chils = xml[2:] if ty == 'satop': into.text('@') into.text(getprop('nomvar', props), 'nomvar') into.text('(') hylo_draw_children(into, chils, sep=' ^ ') into.text(')') elif ty == 'prop': name = getprop('name', props) if name == '[*DEFAULT*]': into.text('*', 'semname') else: into.text(name, 'semname') elif ty == 'diamond': mode = getprop('mode', props) # FIXME: Instead of uppercasing, we really want small caps into.text('<%s>' % mode.upper(), 'semrole') assert len(chils) > 0 if len(chils) == 1: hylo_draw(into, chils[0]) else: into.text('(') hylo_draw_children(into, chils, sep='^') into.text(')') elif ty == 'nomvar': into.text(getprop('name', props), 'nomvar') else: assert False %y hylo_entry : STAR : $$ = ['prop', [('name', '[*DEFAULT*]')]] : typed_word : if $1[0].isupper(): $$ = ['nomvar', [('name', $1)]] else: $$ = ['prop', [('name', $1)]] hylo_entry : LESS word GREATER hylo_entry : $$ = ['diamond', [('mode', $2)], $4] hylo_entry : LESS word GREATER LPAREN hylo_list RPAREN : $$ = ['diamond', [('mode', $2)]] + $5 carets : CARET : carets CARET hylo_entry_0: hylo_entry : hylo_entry carets hylo_list : empty : hylo_list hylo_entry_0 : $$ = $1 + [$2] hylo_list_0 : hylo_list : carets: $$ = [] : carets hylo_list: $$ = $2 hylo_spec : typed_word LPAREN hylo_list_0 RPAREN : $$ = ['satop', [('nomvar', $1)]] + $3 hybrid_logic : hylo_spec* : AT hylo_spec*: $$ = $2 ############################# # Words # ############################# %p def init_morphology(): global morph_xml morph_xml = [] # List families/parts-of-speech of a word. This comes from the # families/parts-of-speech specified in a word {} declaration; hence we # can't really tell families from POS's. This also comes from any # member declarations inside of a family. global word_to_family_pos word_to_family_pos = {} # List word members of a family/part-of-speech; more or less the # inverse of the previous hash. (Not a perfect inverse because it # doesn't currently list any members that come from a member # declaration inside of a family, but only from word {} declarations.) 
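# Hypothetical hybrid-logic annotation and the list form the hylo_* rules above
# build for it (the nominal and role names are made up):
#
#   E:action(* <Actor>X ^ <Patient>Y)
#
#   ['satop', [('nomvar', 'E:action')],
#     ['prop',    [('name', '[*DEFAULT*]')]],
#     ['diamond', [('mode', 'Actor')],   ['nomvar', [('name', 'X')]]],
#     ['diamond', [('mode', 'Patient')], ['nomvar', [('name', 'Y')]]]]
#
# hylo_draw() renders this as @E:action(* ^ <ACTOR>X ^ <PATIENT>Y).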
global family_pos_to_word family_pos_to_word = {} # word->predicate mapping; this comes from pred=foo declarations in the # properties of a word. This is needed because this info must be added # to tags in a family. global word_to_predicate word_to_predicate = {} # Mapping of families to parts-of-speech; comes from family {} # declarations. global family_to_pos family_to_pos = {} # Contains a key for each part-of-speech seen in a family {} # declaration. global pos_hash pos_hash = {} # (XML for) list of word members explicitly specified using a member # statement. global family_members family_members = {} def save_morphology(cur): cur.morph_xml = morph_xml cur.word_to_family_pos = word_to_family_pos cur.family_pos_to_word = family_pos_to_word cur.word_to_predicate = word_to_predicate cur.family_to_pos = family_to_pos cur.pos_hash = pos_hash cur.family_members = family_members # Assume that hash[key] is a list, add VALUE to the list if not already there. def add_uniquely_to_hash_entry_list(hash, key, value): if key not in hash: hash[key] = [] if value not in hash[key]: hash[key] += [value] def note_family_member(word, families): for x in families: add_uniquely_to_hash_entry_list(word_to_family_pos, word, x) add_uniquely_to_hash_entry_list(family_pos_to_word, x, word) def make_word_morph_xml(): xml = [] for x in morph_xml: word_pos_list = [] word = getprop('stem', x[1]) # Each word needs to be listed as many times as it has parts of # speech. We collect together all families and POS's associated # with a word, either from word {} or member declarations, # and determine all POS's from them. for y in word_to_family_pos.get(word, []): if y in family_to_pos: pos = family_to_pos[y] elif y in pos_hash: pos = y else: error(None, 'Family/part-of-speech %s not found (word declaration %s)', y, word) if pos not in word_pos_list: word_pos_list += [pos] for y in word_pos_list: # Make a copy of the word's XML and set the POS appropriately. entry = x[:] putprop('pos', y, entry[1]) xml += [entry] return xml %y word_param: word_list: $$ = ($1, []) : word_list LPAREN ext_attr_list RPAREN: # WORD(VALUE) is equivalent to WORD(class=VALUE). property_name_replace(None, 'class', $3) $$ = ($1, $3) word_spec_1: WORD word COLON word_param: (families, params) = $4 note_family_member($2, families) pred = getoptprop('pred', params) if pred: word_to_predicate[$2] = pred $$ = ($2, [('pos', None), ('stem', $2)] + params) word_spec_1: WORD word COLON: $$ = ($2, [('pos', None), ('stem', $2)]) word_spec: WORD word: $$ = ($2, [('pos', None), ('stem', $2)]) : word_spec_1 word_block: word_spec SEMI: (word, params) = $1 morph_xml.append(['entry', [('word', word)] + params]) word_block: word_spec_1 COLON word_macros SEMI: (word, params) = $1 morph_xml.append(['entry', [('word', word)] + $3 + params]) word_macros: word_list: $$ = [('macros', ' '.join(['@%s' % x for x in $1]))] word_form: word_or_star SEMI: $$ = ($1, []) word_form: word_or_star COLON word_macros SEMI: $$ = ($1, $3) word_forms: : $$ = [] : word_forms word_form : $$ = $1 + [$2] word_block: word_spec LBRACE word_forms RBRACE: (word, params) = $1 for (form, macros) in $3: if form == '*': form = word morph_xml.append(['entry', [('word', form)] + macros + params]) ############################# # Family blocks # ############################# %p def init_lexicon(): global lexicon_xml lexicon_xml = [] def save_lexicon(cur): cur.lexicon_xml = lexicon_xml # lexicon_xml already contains XML for each family and its entries (i.e. # lexical insertion rules). 
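# Hypothetical illustration of that bookkeeping (names made up; assumes a
# family TransVerb declared elsewhere with pos V):
#
#   word bought: TransVerb(pred=buy);
#
# records word_to_family_pos['bought'] = ['TransVerb'] and
# word_to_predicate['bought'] = 'buy', yields a morph.xml entry roughly like
#   <entry word="bought" pos="V" stem="bought" pred="buy"/>
# and make_family_lexicon_xml() below adds
#   <member stem="bought" pred="buy"/>
# to the (closed) TransVerb family in lexicon.xml.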
We also need to add to each family the words # that are members of the family -- these come from both word {} # declarations and member statements. def make_family_lexicon_xml(): for x in lexicon_xml: # Make sure that open families don't have member entries, or otherwise # [*DATE*], [*NUM*], etc. won't work. closed = getprop('closed', x[1]) if closed == 'false': continue name = getprop('name', x[1]) words_seen = [] # Add each stem explicitly given in a member statement. The # predicate comes from any predicate given in the member statement # along with the stem, or from the word {} declaration as a backup. for y in family_members[name]: stem = getprop('stem', y[1]) words_seen += [stem] pred = getoptprop('pred', y[1]) if not pred: pred = word_to_predicate.get(stem, None) x += [['member', [('stem', stem)] + (pred and [('pred', pred)] or [])]] # Add each stem that specifies that it belongs to this family, # unless we already added it. for y in family_pos_to_word.get(name, []): if y not in words_seen: words_seen += [y] pred = word_to_predicate.get(y, None) x += [['member', [('stem', y)] + (pred and [('pred', pred)] or [])]] return lexicon_xml # A CSFamily is a `family {}' block. class CSFamily(CSBlock): def __init__(self, prod, name, props, statements): super(CSFamily, self).__init__(prod) self.name = name self.props = props self.statements = statements self.text = None self.homeButton = None self.btnFrame = None self.menuHolder = None self.childFrame = None self.cfile = None self.cf = None self.vars = None self.canvas = None self.mainFrame = None def draw(self, childFrame, cfile, vars, row, canvas, mainFrame): # Draw the family name f = Frame(childFrame, bd=1, relief=SUNKEN, background='white') cf = draw_into(f, width=20) cf.text('%s' % self.name, 'family name') child_widget=cf.finish() self.menuHolder = child_widget child_widget.pack(fill=BOTH, expand=YES) child_widget.bind("", self.editPopup) self.childFrame = childFrame self.cfile = cfile self.cf = cf self.vars = vars self.canvas = canvas self.mainFrame = mainFrame f.grid(row=row, column=0, sticky=NSEW) # Draw the various statements f = Frame(childFrame, bd=1, relief=SUNKEN, background='white') for x in self.statements: frame = x.draw(f, cfile, vars) if frame: frame.pack(fill=BOTH, expand=YES) f.grid(row=row, column=1, sticky=NSEW) childFrame.rowconfigure(row, weight=1) # Define the binding procedure for the right-click for editing an entry def editPopup(self, event): popup = Menu(self.menuHolder, tearoff =0) popup.add_command(label=' Edit ', command = lambda: self.editSection(self.childFrame, self.cfile, self.cf, self.vars, self.canvas, self.mainFrame)) try: popup.tk_popup(event.x_root+40, event.y_root, 0) finally: popup.grab_release() # Now bind the right-click to the saveSection buttons self.menuHolder.bind("", self.savePopup) # Define the right click binding for the save entry def savePopup(self, event): popup = Menu(self.menuHolder, tearoff = 0) popup.add_command(label = 'Done', command = lambda: self.saveSection(self.childFrame, self.cfile, self.cf, self.vars, self.canvas, self.mainFrame)) popup.add_command(label = 'Home', command = lambda: self.editHome(self.cfile)) fileData = self.cfile.getAllText() popup.add_command(label = 'Undo All', command = lambda: self.undoEdit(fileData, self.cfile)) try: popup.tk_popup (event.x_root+40, event.y_root, 0) finally: popup.grab_release() # Edit a section, i.e. 
a family of the grammar individually rather than the entire grammar # Note that this will have very preliminary editing capabilities and the complete grammar # editing should be done through the Edit global view def editSection(self, childFrame, cfile, hiliteText, vars, canvas, mainFrame): editFrame = Frame(mainFrame, bd=1, background='white') self.text = Text(editFrame, padx=5, wrap=None, undo = YES, background='white', height =10) vbar = Scrollbar(editFrame) hbar = Scrollbar(editFrame, orient='horizontal') self.text.config(yscrollcommand=vbar.set) # call vbar.set on text move self.text.config(xscrollcommand=hbar.set) vbar.config(command=self.text.yview) # call text.yview on scroll move hbar.config(command=self.text.xview) # or hbar['command']=text.xview # Changing the mode of the cfile object here, # so that once the uer clicks done, # the whole object is recompiled and redisplayed cfile.mode= 'Edit' # Highlight the row being edited hiliteText.onHilite() vbar.pack(side=RIGHT, fill=Y) hbar.pack(side=BOTTOM, fill=X) self.text.pack(fill= BOTH, expand= YES) # Set a mark at the beginning of the text self.text.mark_set("START", INSERT) self.text.mark_gravity("START", LEFT) # Push in the rest of the file's contents fileData = cfile.getAllText() self.text.insert(INSERT, fileData) # Move the insert position to the first occurence of the family name # FIXME: this is poor implementation # The positioning of the insert cursor should be happening by parsing the # CFG production rules, using CSFamily.prod.lineno and endlineno self.text.config(takefocus=True) idx= self.text.search('family '+ self.name, "START") self.text.mark_set(CURRENT, idx) self.text.see(CURRENT) #editFrame.grid(row=row+1, columnspan =3, sticky = NSEW) editFrame.grid(row=2, columnspan =2, sticky = NSEW) childFrame.update_idletasks() canvas.config(scrollregion=canvas.bbox("all")) # Finished editing #def saveSection(self, childFrame, cfile, hiliteText, varset, canvas, mainFrame, homeButton, undoButton): def saveSection(self, childFrame, cfile, hiliteText, varset, canvas, mainFrame): # We force the text contents of the cfile object to copy over # all that is presently in the current text-box cfile.setAllText(self.text.get(1.0,END)) # Undo the highlight of the row hiliteText.offHilite() # Recompile whatever was edited and redisplay # Note: changes are not saved hereby!! cfile.compile_if_needed() cfile.onLexicon() # Restore the right-click binding to the original self.menuHolder.bind("", self.editPopup) # Restore view to original place where you wanted to edit def editHome(self, cfile): # Move the insert position to the first occurence of the family name # FIXME: this is poor implementation # The positioning of the insert cursor should be happening by parsing the # CFG production rules, using CSFamily.prod.lineno and endlineno self.text.config(takefocus=True) idx= self.text.search('family '+ self.name, "START") if not idx: showwarning('Error', 'Original entry for '+self.name+ ' not found!') self.text.mark_set(CURRENT, idx) self.text.see(CURRENT) # Undo all editing done till now def undoEdit(self, fileData, cfile): askqn = askokcancel('Warning','Undo all changes till now?') if askqn: self.text.delete("START", END) self.text.insert(CURRENT, fileData) self.editHome(cfile) # CSFamilyEntry is an `entry' statement inside a `family' block. 
# # PROPS is a property list corresponding to the entry's name ('name') and # any other properties, deriving from the form # # entry NAME(PROP=VAL, ...): # # Either the name or properties, or both, may be omitted. # # CAT is the XML corresponding to the entry's category, and LF is the XML for # the logical form (hybrid logic). class CSFamilyEntry(CSStatement): def __init__(self, prod, props, cat, lf=None): super(CSFamilyEntry, self).__init__(prod) self.props = props # NOTE: self.cat is a single XML statement, but self.lf is a list # of XML statements. FIXME. self.cat = cat self.lf = lf def xml(self): if self.lf: lf = [['lf', []] + self.lf] else: lf = [] return [['entry', self.props, self.cat + lf]] def draw(self, parent, cfile, vars): name = getoptprop('name', self.props) f = Frame(parent, background='white') cf = draw_into(f) cf.text(' ') if name: cf.text('%s: ' % name) category_draw(cf, self.cat, depth=0, vars=vars) if self.lf and vars.show_semantics.get(): cf.text(' : ') hylo_draw_children(cf, self.lf) cf.finish().pack(fill=BOTH, expand=YES, side=LEFT) return f # CSFamilyMember is a `member' statement inside a `family' block. ITEMS # lists the items given, in property-list form: # # STEM --> [('stem', STEM)] # STEM(PRED) --> [('stem', STEM), ('pred', PRED)] class CSFamilyMember(CSStatement): def __init__(self, prod, items): super(CSFamilyMember, self).__init__(prod) self.items = items def xml(self): return [['member', x] for x in self.items] def draw(self, parent, cfile, vars): return None f = Frame(parent, background='white', bd=1, relief=SUNKEN) cf = draw_into(f) cf.text('Members: ', 'member heading') first = True for x in self.items: stem = getprop('stem', x) pred = getoptprop('pred', x) if not first: cf.text(', ', 'member comma') cf.text(' %s%s' % (stem, pred and "(pred=%s)" % pred or ''), 'member') first = False print len (self.items) cf.finish().pack(fill=BOTH, expand=YES) return f %y # Omitting the colon between entry category and hybrid logic doesn't # actually cause parsing problems, but it's probably not a good idea to # encourage this, because the syntax might change in the future. entry_name_1: opt_paren_attr_list # We shouldn't need the first entry below, but we do, due to the bugginess # in PLY in handling empty rules. entry_name: word: $$ = [('name', $1)] : word entry_name_1: $$ = [('name', $1)] + $2 : entry_name_1 entry : ENTRY entry_name COLON complexcat COLON hybrid_logic SEMI : $$ = CSFamilyEntry($@, props=$2, cat=$4, lf=$6) entry : ENTRY entry_name COLON complexcat SEMI : $$ = CSFamilyEntry($@, props=$2, cat=$4) member_entry : word : $$ = [('stem', $1)] member_entry : word LPAREN word RPAREN : $$ = [('stem', $1), ('pred', $3)] member_entry_0: member_entry : member_entry commas member : MEMBER COLON member_entry_0+ SEMI : $$ = CSFamilyMember($@, items=$3) family_statement : member | entry family_statement_list : empty : family_statement_list family_statement : $$ = $1 + [$2] family_block : FAMILY word opt_paren_ext_attr_list LBRACE family_statement_list RBRACE : # FAMILY(VALUE) is equivalent to FAMILY(pos=VALUE). property_name_replace(None, 'pos', $3) # Create the AST object -- before adding to $3. $$ = CSFamily($@, name=$2, props=$3, statements=$5) # 'pos' (part of speech) defaults to the family name; they would only # differ when more than one family is used to define a particular part of # speech, to handle related characteristics (family Prep-Nom vs. pos Prep). if not property_specified('pos', $3): $3 += [('pos', $2)] # Store mappings related to POS. 
pos = getprop('pos', $3) family_to_pos[$2] = pos pos_hash[pos] = True # Now construct the XML for the family xml = ['family', [('name', $2)] + $3] family_members[$2] = [] for x in $5: if type(x) is CSFamilyMember: family_members[$2].extend(x.xml()) else: xml.extend(x.xml()) # If members have been specified ('member' statements) and there is no # 'closed' property, make the family closed. # if family_members[$2] and not property_specified('closed', xml[1]): # xml[1] += [('closed', 'true')] # Actually, we *always* need classes closed, due to a bizarreness in # OpenCCG. if not property_specified('closed', xml[1]): xml[1] += [('closed', 'true')] # Add names to entries ('entry' statements) without them. primcount = 0 for x in xml[2:]: if not property_specified('name', x[1]): primcount += 1 x[1] = [('name', 'Entry-%s' % primcount)] + x[1] # For each specified member, note the family it's in so that its part # of speech can be calculated. for x in family_members[$2]: add_uniquely_to_hash_entry_list(word_to_family_pos, getprop('stem', x[1]), $2) lexicon_xml.append(xml) $$.static_xml = [xml] ############################# # Rule blocks # ############################# %p def init_rules(): global rules rules = { ('app', '+') : True, ('app', '-') : True, ('comp', '+') : True, ('comp', '-') : True, ('xcomp', '+') : True, ('xcomp', '-') : True, ('sub', '+') : False, ('sub', '-') : False, ('xsub', '+') : False, ('xsub', '-') : False, ('typeraise', '+') : [(False, True, True)], ('typeraise', '-') : [(True, True, True)], 'typechange' : [], } global rules_to_xml_mapping rules_to_xml_mapping = { 'app' : ['application', []], 'comp' : ['composition', [('harmonic', 'true')]], 'xcomp' : ['composition', [('harmonic', 'false')]], 'sub' : ['substitution', [('harmonic', 'true')]], 'xsub' : ['substitution', [('harmonic', 'false')]], } def save_rules(cur): cur.rules = rules cur.rules_to_xml_mapping = rules_to_xml_mapping def make_rules_xml(): xml = [] unique = 0 for (key, value) in my_sorted(rules.items()): if type(key) is tuple and key[0] in rules_to_xml_mapping: rx = copy.deepcopy(rules_to_xml_mapping[key[0]]) rx[1] += [('dir', key[1] == '+' and 'forward' or 'backward')] xml.append(rx) elif type(key) is tuple and key[0] == 'typeraise': for (dollar, arg, result) in value: xml.append(['typeraising', [('dir', key[1] == '+' and 'forward' or 'backward'), ('useDollar', dollar and 'true' or 'false')]] + (arg != True and [['arg', [], arg]] or []) + (result != True and [['result', [], result]] or [])) elif key == 'typechange': for (arg, result, lf) in value: unique += 1 if lf: lf = [['lf', []] + lf] else: lf = [] xml.append(['typechanging', [('name', 'typechange-%d' % unique)], ['arg', [], arg], ['result', [], result + lf]]) else: raise InternalError("Invalid element in rules hash: %s" % str(key)) return xml def dotyperaise(plusminus, dollarp, arg, result): if plusminus == '+' or plusminus == '+-': rules[('typeraise', '+')] += [(dollarp, arg, result)] if plusminus == '-' or plusminus == '+-': rules[('typeraise', '-')] += [(dollarp, arg, result)] def rulesreinit(): rules.clear() rules[('typeraise', '+')] = [] rules[('typeraise', '-')] = [] rules['typechange'] = [] %y ruletype : APP | COMP | XCOMP | SUB | XSUB opt_dollar : DOLLAR : $$ = True : empty : $$ = False opt_atomcat : atomcat : empty : $$ = True opt_complexcat : COLON complexcat : $$ = $2 : empty : $$ = True plusminus_spec : PLUS | MINUS | PLUSMINUS rule : NO SEMI : rulesreinit() : NO ruletype SEMI | NO ruletype PLUSMINUS SEMI : \ del rules[($2, '+')]; del rules[($2, 
'-')] : NO ruletype PLUS SEMI : del rules[($2, '+')] : NO ruletype MINUS SEMI : del rules[($2, '-')] : NO TYPERAISE SEMI | NO TYPERAISE PLUSMINUS SEMI : \ rules[('typeraise', '+')] = []; rules[('typeraise', '-')] = [] : NO TYPERAISE PLUS SEMI : rules[('typeraise', '+')] = [] : NO TYPERAISE MINUS SEMI : rules[('typeraise', '-')] = [] : NO TYPECHANGE SEMI : rules['typechange'] = [] : ruletype PLUSMINUS SEMI : \ rules[($1, '+')] = True; rules[($1, '-')] = True : ruletype PLUS SEMI : rules[($1, '+')] = True : ruletype MINUS SEMI : rules[($1, '-')] = True : TYPERAISE plusminus_spec opt_dollar opt_complexcat SEMI: dotyperaise($2, $3, $4, True) : TYPERAISE plusminus_spec opt_dollar COLON complexcat GOESTO opt_atomcat SEMI: dotyperaise($2, $3, $5, $7) : TYPECHANGE COLON complexcat GOESTO complexcat SEMI: \ rules['typechange'] += [($3, $5, None)] : TYPECHANGE COLON complexcat GOESTO complexcat COLON hybrid_logic SEMI: \ rules['typechange'] += [($3, $5, $7)] rule_list : rule_list rule : empty rule_block : RULE LBRACE rule_list RBRACE ############################# # Testbed # ############################# %p def init_testbed(): global testbed_statements testbed_statements = [] def save_testbed(cur): cur.testbed_statements = testbed_statements def add_testbed_statement(bang, words, number): testbed_statements.append(['item', [('string', ' '.join(words))] + bang + number]) def make_testbed_xml(): return testbed_statements %y opt_testbed_bang: BANG: $$ = [('known', 'true')] : empty testbed_entry: opt_testbed_bang word_list SEMI: \ add_testbed_statement($1, $2, []) : opt_testbed_bang word_list COLON NUMBER SEMI: \ add_testbed_statement($1, $2, [('numOfParses', $4)]) testbed_block: TESTBED LBRACE testbed_entry* RBRACE ############################# # Relation-sorting # ############################# %p def init_relation_sorting(): global relation_sorting relation_sorting = [] def save_relation_sorting(cur): cur.relation_sorting = relation_sorting def make_relation_sorting_lexicon_xml(): if relation_sorting: return [['relation-sorting', [('order', ' '.join(relation_sorting))]]] else: return [] %y relation_sorting_block: RELATION_SORTING COLON word_or_star_0 * SEMI: global relation_sorting relation_sorting += $3 ############################# # End Yacc Declarations # ############################# %p def p_error(p): if p: error(p.lineno, "Syntax error at '%s'", p.value) else: error(None, "Unexpected end of file") ############################# # Lexer classes # ############################# # A Lexer that allows for a list of tokens to be pushed onto the front of # the list of tokens to be returned. Any number of such lists can be # pushed. class StackLexer(object): def __init__(self, lexer): self.lexer = lexer self.tokenstack = [] self.tokenstackind = [] self.lineno = 1 def input(self, s): self.lexer.input(s) def pushstack(self, stack): self.tokenstack.append(stack) self.tokenstackind.append(0) def token(self): global return_bogus_value if return_bogus_value: return_bogus_value = 0 tok = CCGToken('BOGUS_VALUE', 'BOGUS_VALUE') tok.lineno = self.lineno return tok while self.tokenstack: try: tok = self.tokenstack[-1][self.tokenstackind[-1]] self.tokenstackind[-1] += 1 return tok except IndexError: self.tokenstack.pop() self.tokenstackind.pop() if self.lexer: tok = self.lexer.token() if tok: self.lineno = tok.lineno return tok return None # A Lexer that checks for macro calls and expands them appropriately. 
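# Hypothetical rule and testbed blocks and (roughly) the XML the helpers above
# derive from them; the categories and the test sentence are made up:
#
#   rule {
#     no sub;
#     no typeraise;
#     typeraise +: np => s;
#   }
#   testbed {
#     the dog barks: 1;
#   }
#
# make_rules_xml() drops the harmonic substitution combinators and emits
#   <typeraising dir="forward" useDollar="false">
#     <arg><atomcat type="np"> ... </atomcat></arg>
#     <result><atomcat type="s"> ... </atomcat></result>
#   </typeraising>
# while make_testbed_xml() yields
#   <item string="the dog barks" numOfParses="1"/>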
class MacroLexer(StackLexer): def __init__(self, lexer): self.last_token = None self.indentlevel = 0 super(MacroLexer, self).__init__(lexer) def simpletoken(self): return super(MacroLexer, self).token() def noeoftoken(self): tok = self.innertoken() if not tok: raise SyntaxError("Unexpected EOF") return tok def innertoken(self): macrotok = self.simpletoken() if not macrotok or no_macro_sub or \ not (macrotok.type == 'ID' and macrotok.value in macro_defs): return macrotok else: newtok = self.simpletoken() if not newtok or newtok.type != 'LPAREN': self.pushstack([newtok]) return macrotok macrodef = macro_defs[macrotok.value] args = [] stop = False while not stop: thisarg = [] parencount = 0 expect_rbrace = 0 newtok = self.noeoftoken() if newtok.type == 'LBRACE': parencount += 1 expect_rbrace = 1 newtok = self.noeoftoken() while True: if newtok.type in ['LBRACE', 'LBRACKET', 'LPAREN']: parencount += 1 if newtok.type in ['RBRACE', 'RBRACKET', 'RPAREN']: parencount -= 1 if parencount < 0: if newtok.type == 'RPAREN': stop = True break error(newtok.lineno, "Syntax error at %s", newtok.value) parencount = 0 if parencount == 0 and newtok.type == 'RBRACE' and \ expect_rbrace: expect_rbrace = 0 newtok = self.noeoftoken() continue if parencount == 0 and newtok.type == 'COMMA': break thisarg.append(newtok) newtok = self.noeoftoken() args.append(thisarg) # Allow extra trailing comma if len(args) == len(macrodef.args) + 1 and not args[-1]: args.pop() if len(args) != len(macrodef.args): error(macrotok.lineno, "Invalid number of arguments to macro %s", macrotok.value) else: if super_macro_debug: print "Processing macro: %s" % macrotok.value self.pushstack(macrosub(macrodef, args, self.lineno)) return self.innertoken() def token(self): def pretty_output_transformed(token): def newline(num=1): outout('\n' * num) outout(' ' * 2 * self.indentlevel) if tok.lineno and self.lineno < tok.lineno: if tok.lineno - self.lineno == 1: newline() else: newline(2) elif self.last_token and (self.last_token.type == 'RBRACE' or self.last_token.type == 'SEMI'): newline() elif tok.type == 'LBRACE': newline(2) value = str(tok.value) lastval = self.last_token and str(self.last_token.value) if value and lastval and ((isalnumund(lastval[0]) and isalnumund(value[0])) or self.last_token.type in ('COLON', 'COMMA')): outout(' ') if tok.type == 'QUOTEDID': outout('"%s"', value) else: outout('%s', value) if tok.type == 'LBRACE': self.indentlevel += 1 elif tok.type == 'RBRACE': self.indentlevel -= 1 return tok # Beginning of actual function tok = self.innertoken() if options.transformed_input and self.lexer and \ tok and tok.type != 'BOGUS_VALUE': pretty_output_transformed(tok) self.last_token = tok # print "Saw token: %s" % tok return tok ############################# # Parsing # ############################# def init_parse_once(): # Initialize the parser once, at beginning. This does introspection on # the rules (i.e. p_*() functions) in this file. yacc.yacc(start='top', debug=yacc_debug, method='LALR', write_tables=0) # Parse a .CCG file whose contents are in STR. class parse_results: pass def parse_string(str): retval = parse_results() if str: retval.parse = yacc.parse(str, lexer=MacroLexer(globallexer)) else: retval.parse = [] save_global_state(retval) return retval ############################# # Graphics # ############################# # Given the return value from parsing (a list of abstract syntax tree-related # objects), draw them into the given frame. 
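# Minimal programmatic sketch of the parsing entry points defined in this file
# (hypothetical; assumes a readable .ccg file such as the tiny sample grammar):
#
#   init_global_state_once()    # build the LALR tables via yacc.yacc()
#   init_global_state()         # reset the per-file global tables
#   res = parse_string(open('ccg-format-grammars/tiny/tiny.ccg').read())
#   # res.parse holds the AST-like objects (e.g. CSFamily) built by the
#   # grammar actions; the feature, morph, lexicon, rule and testbed tables
#   # are copied onto res by save_global_state().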
def draw_parse(parse, cfile, childFrame, vars, canvas, mainFrame): row = 0 if parse: for x in parse: if hasattr(x, 'draw'): x.draw(childFrame, cfile, vars, row, canvas, mainFrame) row += 1 # Make the column containing the lexical entries expand as necessary childFrame.columnconfigure(1, weight=1) #frame.grid(column=0) ############################# # Initialization # ############################# # We encapsulate all global-variable initialization into a function that # can be called repeatedly so we can reinitialize our state and parse more # than one file. ARGV is the command-line arguments to parse (normally # sys.argv[1:]) and ERRORS_TO_STRING indicates whether to write stdout and # stderr output to strings or to the normal output locations. def init_global_state(errors_to_string=False): init_errors(errors_to_string) init_lexer() init_macros() init_features() init_morphology() init_lexicon() init_testbed() init_rules() init_relation_sorting() # When we're finished parsing, save the global state to the specified # object, so we can track the parse results for more than one file. def save_global_state(cur): save_errors(cur) save_lexer(cur) save_macros(cur) save_features(cur) save_morphology(cur) save_lexicon(cur) save_testbed(cur) save_rules(cur) save_relation_sorting(cur) def init_global_state_once(): init_parse_once() late_init_graphics_done = 0 # Graphics-related initialization that must be done late, after the first # Tk top-level window has been created. def late_init_graphics(): global late_init_graphics_done if not late_init_graphics_done: late_init_draw_once() late_init_graphics_done = 1 ############################# # Main driver # ############################# # Function to output a particular XML file def output_xml_file(prefix, grammar_name, filebase, top_level_tag, xml): xml_file = os.path.join(options.dir, '%s%s.xml' % (prefix, filebase)) if not options.quiet: errout('Outputting XML file: %s\n' % xml_file) xml = [top_level_tag, [('name', grammar_name), ('xmlns:xsi', 'http://www.w3.org/2001/XMLSchema-instance'), ('xsi:noNamespaceSchemaLocation', '../%s.xsd' % filebase)]] + xml fil = open(xml_file, 'w') fil.write('\n') print_xml(fil, xml) fil.close() def make_grammar_xml(prefix): return [['lexicon', [('file', '%slexicon.xml' % prefix)]], ['morphology', [('file', '%smorph.xml' % prefix)]], ['rules', [('file', '%srules.xml' % prefix)]], ['types', [('file', '%stypes.xml' % prefix)]]] # Map saying how to output the specified XML file output_file_map = { 'lexicon': ('ccg-lexicon', lambda pref: make_feature_lexicon_xml() + make_relation_sorting_lexicon_xml() + make_family_lexicon_xml()), 'rules': ('rules', lambda pref: make_rules_xml()), 'morph': ('morph', lambda pref: make_word_morph_xml() + make_feature_morph_xml()), 'types': ('types', lambda pref: make_feature_types_xml()), 'grammar': ('grammar', make_grammar_xml), 'testbed': ('regression', lambda pref: make_testbed_xml()), } # Process the --omit-output list. 
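# For example (hypothetical invocations, following the logic in main() below;
# the grammar file name is made up):
#
#   ccg2xml tiny.ccg                         # writes tiny-lexicon.xml, tiny-morph.xml,
#                                            # tiny-rules.xml, tiny-types.xml,
#                                            # tiny-grammar.xml and tiny-testbed.xml
#   ccg2xml --omit-output testbed tiny.ccg   # everything except tiny-testbed.xml
#   ccg2xml --omit-output +morph tiny.ccg    # only tiny-morph.xml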
def split_output_files(arg): files = re.split('[,\s]+', arg) for x in files: if x not in output_file_map: parser.error('Unknown file in --omit-output argument') return files def main(): parse_arguments(sys.argv[1:]) init_global_state_once() init_global_state() if options.omit_output: if options.omit_output[0] == '+': output_files = split_output_files(options.omit_output[1:]) else: suppress_output = split_output_files(options.omit_output) output_files = [] for x in output_file_map: if x not in suppress_output: output_files.append(x) else: output_files = [x for x in output_file_map] # Now actually parse the input arguments prefix = options.prefix lastfile = '-' args = global_args or ['-'] for arg in args: if arg == '-': if not options.quiet: errout("ccg2xml: Processing standard input\n") fil = sys.stdin else: if not options.quiet: errout("ccg2xml: Processing %s\n" % arg) fil = file(arg) lastfile = arg if prefix == None: (phead, ptail) = os.path.split(arg) (pbase, pext) = os.path.splitext(ptail) prefix = '%s-' % pbase retval = parse_string(fil.read()) # print "Retval: %s\n" % retval if macro_debug: print_macros() # Make output directory if needed, and output files if error_count > 0: if not options.quiet: maybe_errout('Errors during compilation, files not output.\n') sys.exit(1) else: if options.dir: if not os.path.isdir(options.dir): os.makedirs(options.dir) else: options.dir = '.' for x in output_files: file_info = output_file_map[x] output_xml_file(prefix, lastfile, x, file_info[0], file_info[1](prefix)) if __name__ == '__main__': # when run as a script main() # Local Variables: # mode: python # end: ================================================ FILE: src/ccg2xml/ccg_editor.py ================================================ #!/usr/bin/python # Author: Ben Wing # Date: April 2006 ############################################################################# # # # ccg_editor.ply # # # # Edit a CCG-format file, graphically. Will have a mode for displaying # # CCG files in a friendly fashion and allowing for editing of parts or # # all of the file. Will also have a mode for testing a CCG grammar, and # # allow for compilation and error-finding under control of the editor. # # # ############################################################################# # This code is based on PyEdit version 1.1, from Oreilly's Programming # Python, 2nd Edition, 2001, by Mark Lutz. from Tkinter import * # base widgets, constants from tkFileDialog import * # standard dialogs from tkMessageBox import * from tkSimpleDialog import * from tkColorChooser import askcolor from string import split, atoi import sys, os, string, md5 import ccg2xml import Tree import re START = '1.0' # index of first char: row=1,col=0 SEL_FIRST = SEL + '.first' # map sel tag to index SEL_LAST = SEL + '.last' # same as 'sel.last' FontScale = 0 # use bigger font on linux if sys.platform[:3] != 'win': # and other non-windows boxes FontScale = 3 # Initial top-level window; it's not clear we need this. # FIXME: It sucks that we have to call Tk() to get the first top-level window # but Toplevel() for all others. We should be able to call Tk() initially, # and then Toplevel() to create all top-level windows, including the first. root = None # List of all open CFile objects openfiles = {} filenames = [] class CTab(Frame): # Initialize this tab. Usually called from a subclass. 
PARENT is # the parent widget, CFILE the CFile object associated with the # top-level window, and TABNAME is the name of this tab (that tab # will be removed from the toolbar). def __init__(self, parent, cfile, tabname): Frame.__init__(self, parent) self.parent = parent self.cfile = cfile self.toolbar = None self.checkbar = None self.menubar = [ ('File', 0, [('Open...', 0, self.cfile.onOpen), ('New', 0, self.cfile.onNew), ('Save', 0, self.onSave), ('Save As...', 5, self.onSaveAs), ('Close', 0, self.cfile.onClose), 'separator', ('Quit VisCCG', 0, self.cfile.onQuit)] ), ('Tools', 0, [('Font List', 0, self.cfile.onFontList), ('Pick Bg...', 4, self.cfile.onPickBg), ('Pick Fg...', 0, self.cfile.onPickFg), ('Color List', 0, self.cfile.onColorList), 'separator', ('Info...', 0, self.cfile.onInfo)] ) ] self.toolbar = [ # ('Display', self.cfile.onDisplay, {'side': LEFT}), ('Edit', self.cfile.onEdit, {'side': LEFT}), ('Lexicon', self.cfile.onLexicon, {'side': LEFT}), ('Testbed', self.cfile.onTestbed, {'side': LEFT}), ('Features', self.cfile.onFeatures, {'side': LEFT}), ('Words', self.cfile.onWords, {'side': LEFT}), ('Rules', self.cfile.onRules, {'side': LEFT}), ('Quit', self.cfile.onClose, {'side': RIGHT}), ('Help', self.cfile.help, {'side': RIGHT}), ('Save', self.onSave, {'side': RIGHT}), ] # self.remove_toolbar_button(tabname) # Add MENU (a tuple corresponding to a single top-level menu item) # after the item with the name AFTER. def add_menu(self, after, menu): newmenu = [] for x in self.menubar: newmenu += [x] if x[0] == after: newmenu += [menu] self.menubar = newmenu # Remove the toolbar button named NAME. def remove_toolbar_button(self, name): newtoolbar = [] for x in self.toolbar: if x[0] != name: newtoolbar += [x] self.toolbar = newtoolbar def reinit(self): pass ##################### # File menu commands ##################### def onSave(self): self.onSaveAs(self.cfile.currfile) # may be None def onSaveAs(self, forcefile=None): file = forcefile or self.cfile.my_asksaveasfilename() if file: text = self.cfile.getAllText() try: open(file, 'w').write(text) except: showerror('CCG Editor', 'Could not write file ' + file) else: self.cfile.setFileName(file) # may be newly created self.cfile.edit_modified(NO) self.cfile.last_save_signature = self.cfile.getSignature(text) class CEdit(CTab): def __init__(self, parent, cfile): CTab.__init__(self, parent, cfile, 'Edit') self.debugFrame= None # Add a frame here, so that debug mode can be enabled # by embedding other objects within this frame editFrame = Frame(self, bd=1, bg= 'white') editFrame.pack(fill=BOTH, expand=YES, side=TOP) # Add a button frame, embed the button and # link to command for the debug mode btnFrame = Frame(editFrame, bd = 1) btnFrame.grid (row=0, columnspan=3, sticky=NSEW) vldButton = Button (btnFrame, text='Validate', command = lambda: self.onValidate(editFrame, cfile)) vldButton.pack(side=RIGHT) # Put the main edit window in the row below this vbar = Scrollbar(editFrame) hbar = Scrollbar(editFrame, orient='horizontal') self.text = Text(editFrame, padx=5, wrap='none', undo=YES) vbar.grid(row=1, column=2, sticky=NS) hbar.grid(row=2, columnspan=2, sticky=EW) # pack text last self.text.grid(row=1, column=1, sticky=NSEW) # else sbars clipped editFrame.columnconfigure(1, weight=1) editFrame.rowconfigure(1, weight=1) # Add a list containing line numbers self.lineList = Text(editFrame, relief=SUNKEN, bg='white', bd=2, yscrollcommand = vbar.set, width=3) self.lineList.grid(row=1, column=0, sticky=NS) 
self.lineList.config(font=self.cfile.fonts[0], bg=self.cfile.colors[0]['bg'], fg=self.cfile.colors[0]['fg']) # TODO: The first time the display of the line numbers # strangely doesn't go through --- somehow cfile # isn't initialized. However, it works properly in the display. # Need to understand why this happens. try: self.showLineNums() except KeyError: self.text.config(yscrollcommand=vbar.set) # call vbar.set on text move self.text.config(xscrollcommand=hbar.set) #vbar.config(command=text.yview) # call text.yview on scroll move hbar.config(command=self.text.xview) # or hbar['command']=text.xview self.text.config(font=self.cfile.fonts[0], bg=self.cfile.colors[0]['bg'], fg=self.cfile.colors[0]['fg']) #Setting the movement of the listbox and the text #together to be controlled by the scrollbar vbar.config(command=self.scrollSet) self.add_menu('File', ('Edit', 0, [('Cut', 0, self.onCut), ('Copy', 1, self.onCopy), ('Paste', 0, self.onPaste), 'separator', ('Delete', 0, self.onDelete), ('Select All', 0, self.onSelectAll)] )) self.add_menu('Edit', ('Search', 0, [('Goto...', 0, self.cfile.onGoto), ('Find...', 0, self.cfile.onFind), ('Refind', 0, self.cfile.onRefind), ('Change...', 0, self.onChange)] )) def scrollSet(self, *args): self.lineList.yview(*args) self.text.yview(*args) def reinit(self): self.showLineNums() self.text.focus() def showLineNums(self): #Make the list of lines editable self.lineList.config(state=NORMAL) textData = self.cfile.getAllText() listOfLines = textData.split('\n') for num in range(1,len(listOfLines)): self.lineList.insert(END,"%s\n" % num) #Now that we are done changing the number of lines, #we reset the text to be uneditable self.lineList.config(state=NORMAL) def onValidate(self, editFrame, cfile): #showwarning(title= 'Sorry', message='Validate and debug feature coming soon!') # Destroy previous display of debug or error messages # if present if self.debugFrame: self.debugFrame.grid_forget() # Compile if file signature has changed cfile.compile_if_needed() # Now, call the error debug routine if errors are found if (ccg2xml.error_count > 0): self.debugError(editFrame, cfile) else: showinfo(title='VisCCG: Success', message='No validation errors!') def debugError(self, editFrame, cfile): self.debugFrame = Frame(editFrame, bg='white', bd=2) self.debugFrame.grid(row=3, columnspan=2, sticky=NSEW) # Create Listbox and scrollbars sbar = Scrollbar(self.debugFrame) list = Listbox(self.debugFrame, relief=SUNKEN, bg='white', bd=2, yscrollcommand = sbar.set) sbar.config(command=list.yview) list.pack(fill=BOTH, side=LEFT, expand=YES) sbar.pack(fill=Y, side=RIGHT) # Display each message in the log for mesg in ccg2xml.message_log: type = mesg[0] lineno = mesg[1] errwarn = mesg[2] if lineno: dispError = type+' at Line '+str(lineno)+': '+errwarn else: dispError = type+': '+errwarn list.insert(END, dispError) ##################### # Edit menu commands ##################### def onCopy(self): # get text selected by mouse,etc if not self.text.tag_ranges(SEL): # save in cross-app clipboard showerror('CCG Editor', 'No text selected') else: text = self.text.get(SEL_FIRST, SEL_LAST) self.clipboard_clear() self.clipboard_append(text) def onDelete(self): # delete selected text, no save if not self.text.tag_ranges(SEL): showerror('CCG Editor', 'No text selected') else: self.text.delete(SEL_FIRST, SEL_LAST) def onCut(self): if not self.text.tag_ranges(SEL): showerror('CCG Editor', 'No text selected') else: self.onCopy() # save and delete selected text self.onDelete() def onPaste(self): try: text 
= self.selection_get(selection='CLIPBOARD') except TclError: showerror('CCG Editor', 'Nothing to paste') return self.text.insert(INSERT, text) # add at current insert cursor self.text.tag_remove(SEL, '1.0', END) self.text.tag_add(SEL, INSERT+'-%dc' % len(text), INSERT) self.text.see(INSERT) # select it, so it can be cut def onSelectAll(self): self.text.tag_add(SEL, '1.0', END+'-1c') # select entire text self.text.mark_set(INSERT, '1.0') # move insert point to top self.text.see(INSERT) # scroll to top ####################### # Search menu commands ####################### def onChange(self): new = Toplevel(self) Label(new, text='Find text:').grid(row=0, column=0) Label(new, text='Change to:').grid(row=1, column=0) self.change1 = Entry(new) self.change2 = Entry(new) self.change1.grid(row=0, column=1, sticky=EW) self.change2.grid(row=1, column=1, sticky=EW) Button(new, text='Find', command=self.onDoFind).grid(row=0, column=2, sticky=EW) Button(new, text='Apply', command=self.onDoChange).grid(row=1, column=2, sticky=EW) new.columnconfigure(1, weight=1) # expandable entrys def onDoFind(self): self.onFind(self.change1.get()) # Find in change box def onDoChange(self): if self.text.tag_ranges(SEL): # must find first self.text.delete(SEL_FIRST, SEL_LAST) # Apply in change self.text.insert(INSERT, self.change2.get()) # deletes if empty self.text.see(INSERT) self.onFind(self.change1.get()) # goto next appear self.text.update() # force refresh #################################### # Others, useful outside this class #################################### def isEmpty(self): return not self.getAllText() def getAllText(self): return self.text.get('1.0', END+'-1c') # extract text as a string def setAllText(self, text): self.text.delete('1.0', END) # store text string in widget self.text.insert(END, text) # or '1.0' self.text.mark_set(INSERT, '1.0') # move insert point to top self.text.see(INSERT) # scroll to top, insert set self.cfile.edit_modified(NO) def clearAllText(self): self.text.delete('1.0', END) # clear text in widget class CWords(CTab): def __init__(self, parent, cfile): CTab.__init__(self, parent, cfile, 'Words') self.child=None self.wordList = None self.cfile = cfile # Called when we switch to this mode using the toolbar at top. def reinit(self): if self.child: self.child.pack_forget() self.child = Frame(self, background='white') self.child.pack(expand=YES, fill=BOTH) scrollbar = Scrollbar(self.child, orient=VERTICAL) self.wordList = Listbox(self.child, yscrollcommand=scrollbar.set) self.wordList.grid(row=0, column=0, sticky=N+S+E+W) scrollbar.config(command= self.wordList.yview) scrollbar.grid(row=0, column=1, sticky=N+S) self.child.grid_rowconfigure(0, weight=1) self.child.grid_columnconfigure(0, weight=1) #If the data hasn't been compiled yet, then do so try: dummy = ccg2xml.morph_xml except: self.cfile.compile_if_needed() #Adding dummy code for all words for x in ccg2xml.morph_xml: assert x[0] == 'entry' self.wordList.insert (END, ccg2xml.getprop('word', x[1])) #print ccg2xml.getprop('word', x[1]) class CLexicon(CTab): class lexicon_vars(object): def __init__(self): self.show_feat_id = IntVar() self.show_feat_id.set(1) self.show_feat_struct = IntVar() self.show_feat_struct.set(1) self.show_full_features = IntVar() self.show_full_features.set(0) self.show_semantics = IntVar() self.show_semantics.set(1) def __init__(self, parent, cfile): CTab.__init__(self, parent, cfile, 'Lexicon') self.child = None self.cnv = None self.mainFrame = None self.vars = self.lexicon_vars() # FIXME? 
It's a bit awkward that ccg.ply has references to the # variables below scattered throughout it. But I'm not sure what # a better solution would be. self.checkbar = [ ("Show feature ID's", self.vars.show_feat_id), ("Show features", self.vars.show_feat_struct), ('Full-form features', self.vars.show_full_features), ('Show semantics', self.vars.show_semantics), ] # Called when we switch to this mode using the toolbar at top. def reinit(self): self.redraw() def redraw(self): self.cfile.compile_if_needed() if self.child: self.child.pack_forget() if self.mainFrame: self.mainFrame.pack_forget() self.mainFrame = Frame(self, bd=1, bg='white') self.mainFrame.pack_propagate(0) self.mainFrame.pack(expand=YES, fill=BOTH) self.mainFrame.grid_rowconfigure(0, weight=1) self.mainFrame.grid_columnconfigure(0, weight=1) xscrollbar = Scrollbar(self.mainFrame, orient=HORIZONTAL) xscrollbar.grid(row=1, column=0, sticky=E+W) yscrollbar = Scrollbar(self.mainFrame) yscrollbar.grid(row=0, column=1, sticky=N+S) self.cnv = Canvas(self.mainFrame, bd=2, xscrollcommand=xscrollbar.set, yscrollcommand=yscrollbar.set, width = 847, height=369) xscrollbar.config(command= self.cnv.xview) yscrollbar.config(command= self.cnv.yview) self.child = Frame(self.cnv, bd=2, relief=SUNKEN, background='white') self.cnv.create_window(0, 0, anchor='nw', window=self.child) ccg2xml.draw_parse(self.cfile.curparse.parse, self.cfile, self.child, self.vars, self.cnv, self.mainFrame) self.child.update_idletasks() self.cnv.config(scrollregion=self.cnv.bbox("all")) self.cnv.grid(row=0, column=0, sticky='NSEW') class CRules(CTab): def __init__(self, parent, cfile): CTab.__init__(self, parent, cfile, 'Rules') class CFeatures(CTab): def __init__(self, parent, cfile): CTab.__init__(self, parent, cfile, 'Features') self.child=None self.checkbar=None self.edit=None self.text=None # Called when we switch to this mode using the toolbar at top. 
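    # Illustrative note (not part of the original source): reinit() below keeps
    # the feature hierarchy in a plain dict, self.tree, mapping each node label
    # to the list of its child labels, rooted at the grammar file's base name.
    # For a hypothetical grammar "tiny.ccg" with a feature "num" whose values
    # are "sg" and "pl", it would look roughly like:
    #
    #     self.tree = {'tiny': ['num'], 'num': ['sg', 'pl'], 'sg': [], 'pl': []}
    #
    # get_treedata() then hands each node's children to the Tree widget on
    # demand, and expand_tree() walks the result recursively.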
def reinit(self): if self.child: self.child.pack_forget() self.child = Frame(self, background='white', width = 847, height = 369) self.child.pack(expand=YES, fill=BOTH) butframe = Frame(self.child, cursor='hand2', relief=SUNKEN, bd=2) butframe.pack(fill=X) but1 = Button(butframe, text='Expand All', command=self.expand_all) but1.pack(side=LEFT) but2 = Button(butframe, text='Contract All', command=self.contract_all) but2.pack(side=LEFT) # Force editing in the same frame: but a lower view: # pass self.child as the parent frame self.edit = Button(butframe, text='Edit', command= lambda:self.edit_tree(self.child)) self.edit.pack(side=RIGHT) featframe = Frame(self.child, bd=2, relief=SUNKEN, background='white') featframe.pack(expand=YES, fill=BOTH) self.cfile.compile_if_needed() # Build the tree self.tree={} self.root_name = re.sub(r'^(.*)\.(.*)$', r'\1', self.cfile.file) self.tree[self.root_name]=[] for feat in self.cfile.curparse.feature_to_values: self.tree[self.root_name] += [str(feat)] for feat in self.cfile.curparse.feature_to_values: self.tree[feat] = [] for x in self.cfile.curparse.feature_to_values[feat]: if x.name not in self.tree: self.tree[x.name] = [] for x in self.cfile.curparse.feature_to_values[feat]: if x.parents: par = x.parents[0] self.tree[par.name] += [x.name] else: self.tree[feat] += [x.name] # Define the images for opened and closed categories shut_icon=PhotoImage(data='R0lGODlhCQAQAJH/AMDAwAAAAGnD/wAAACH5BAEAAAAALAAA' 'AAAJABAAQAIdhI8hu2EqXIroyQrb\nyRf0VG0UxnSZ5jFjulrhaxQ' 'AO6olVwAAOw==') open_icon=PhotoImage(data='R0lGODlhEAAJAJH/AMDAwAAAAGnD/wAAACH5BAEAAAAALAAA' 'AAAQAAkAQAIahI+pyyEPg3KwPrko\nTqH7/yGUJWxcZTapUQAAO8b' 'yUgAAOw==') # Create the tree self.t=Tree.Tree(master=featframe, root_id='', root_label=self.root_name, collapsed_icon=shut_icon, expanded_icon=open_icon, get_contents_callback=self.get_treedata, line_flag=False) self.t.grid(row=0, column=0, sticky = 'nsew') featframe.grid_rowconfigure(0, weight=1) featframe.grid_columnconfigure(0, weight=1) sb=Scrollbar(featframe) sb.grid(row=0, column=1, sticky='ns') self.t.configure(yscrollcommand=sb.set) sb.configure(command=self.t.yview) sb=Scrollbar(featframe, orient=HORIZONTAL) sb.grid(row=1, column=0, sticky='ew') self.t.configure(xscrollcommand=sb.set) sb.configure(command=self.t.xview) # Expand the whole tree out self.expand_tree(self.t.root) # Returns the nodes rooted at the node passed and adds them to the tree def get_treedata(self,node): lbl = str(node.get_label()) children = self.tree[lbl] for x in children: if self.tree[x]: expands=1 else: expands=0 self.t.add_node(name=x,flag=expands) # Expand the tree rooted at node recursively def expand_tree(self, node): node.expand() for child in node.children(): if child.expandable(): self.expand_tree(child) def expand_all(self): self.expand_tree(self.t.root) def contract_all(self): self.t.root.collapse() def edit_tree(self, parent): editFrame = Frame(parent, bd=1, background='white') self.text = Text(editFrame, padx=5, wrap=None, undo = YES, background='white') vbar = Scrollbar(editFrame) hbar = Scrollbar(editFrame, orient='horizontal') self.text.config(yscrollcommand=vbar.set) # call vbar.set on text move self.text.config(xscrollcommand=hbar.set) vbar.config(command=self.text.yview) # call text.yview on scroll move hbar.config(command=self.text.xview) # or hbar['command']=text.xview # Change the text on the button, and also pass the rest # of the arguments so that the grid for the statements can be reset self.edit.config(text='Done', command= 
lambda:self.save_tree(parent)) # Changing the mode of the cfile object here, # so that once the user clicks done, # the whole object is recompiled and redisplayed self.cfile.mode= 'Edit' vbar.pack(side=RIGHT, fill=Y) hbar.pack(side=BOTTOM, fill=X) self.text.pack(fill= BOTH, expand= YES) # Set a mark at the beginning of the text self.text.mark_set("START", INSERT) self.text.mark_gravity("START", LEFT) # Push in the rest of the file's contents fileData = self.cfile.getAllText() self.text.insert(INSERT, fileData) # Move the insert position to the first occurence of the family name # FIXME: this is poor implementation # The positioning of the insert cursor should be happening by parsing the # CFG production rules, using CSFamily.prod.lineno and endlineno self.text.config(takefocus=True) idx= self.text.search('feature', "START") if idx: self.text.mark_set(CURRENT, idx) self.text.see(CURRENT) else: showwarning('Warning','Features not located in text') editFrame.pack(expand=YES, fill=BOTH) def save_tree(self, parent): # We force the text contents of the cfile object to copy over # all that is presently in the current text-box self.cfile.setAllText(self.text.get(1.0,END)) self.edit.config(text='Edit', command= lambda:self.edit_tree(parent)) # Recompile whatever was edited and redisplay # Note: changes are not saved hereby!! self.cfile.compile_if_needed() self.cfile.onFeatures() class CTestbed(CTab): def __init__(self, parent, cfile): CTab.__init__(self, parent, cfile, 'Testbed') self.child = None self.edit = None self.text = None self.editFrame = None self.cnv = None self.mainFrame = None self.newInsert = None def makelab(self, text, row, col, **props): lab = Label(self.child, text=text, background='white', **props) # Make the label grow to fill all space allocated for the column lab.grid(row=row, column=col, sticky='NSEW') # Called when we switch to this mode using the toolbar at top. 
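    # Illustrative note (not part of the original source): reinit() below draws
    # one row per entry of curparse.testbed_statements.  Each entry is expected
    # to look roughly like
    #
    #     ['item', [('numOfParses', 1), ('string', 'the dog barks')]]
    #
    # (the sentence is a made-up example); ccg2xml.getprop() pulls out the
    # 'numOfParses' and 'string' properties, and sentences with zero parses are
    # prefixed with '*'.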
def reinit(self): if self.child: self.child.pack_forget() if self.mainFrame: self.mainFrame.pack_forget() self.mainFrame = Frame(self, bd=1, bg='white') self.mainFrame.pack(expand=YES, fill=BOTH) self.mainFrame.grid_rowconfigure(0, weight=1) self.mainFrame.grid_columnconfigure(0, weight=1) xscrollbar = Scrollbar(self.mainFrame, orient=HORIZONTAL) xscrollbar.grid(row=1, column=0, sticky=E+W) yscrollbar = Scrollbar(self.mainFrame) yscrollbar.grid(row=0, column=1, sticky=N+S) self.cnv= Canvas(self.mainFrame, bd=2, xscrollcommand=xscrollbar.set, yscrollcommand=yscrollbar.set, width = 847, height=369) xscrollbar.config(command=self.cnv.xview) yscrollbar.config(command=self.cnv.yview) self.child = Frame(self.cnv, bd=2, relief=SUNKEN, background='white') self.child.rowconfigure(1, weight=1) self.child.columnconfigure(1, weight=1) self.child.pack(expand=YES, fill=BOTH) butnFrame = Frame(self.child, relief=SUNKEN, bd=2) butnFrame.grid(row=0, sticky='NSEW', columnspan=2) self.edit = Button(butnFrame, text='Edit', command= self.edit_testbed) self.edit.pack(side=RIGHT) self.newInsert = Button(butnFrame, text='New Sentence', command= self.new_sentence) self.newInsert.pack(side=RIGHT) self.cfile.compile_if_needed() self.makelab("Num Parses", 1, 0, bd=1, relief=SUNKEN, fg="#77AA77", font = ("Helvetica", FontScale +12)) self.makelab("Sentence", 1, 1, bd=1, relief=SUNKEN, fg="#77AA77", font = ("Helvetica", FontScale +12)) # Make the column containing the sentences grow to include all # extra space self.child.columnconfigure(1, weight=1) for i in xrange(len(self.cfile.curparse.testbed_statements)): x = self.cfile.curparse.testbed_statements[i] assert x[0] == 'item' x = x[1] # Left-justify the text numparse = ccg2xml.getprop('numOfParses', x) string = ccg2xml.getprop('string', x) # How many parses of the sentence are produced? 
self.makelab('%s' % numparse, i+2, 0) # Print the sentence itself self.makelab('%s%s' % (numparse == 0 and '*' or '', string), i+2, 1, anchor=W) self.cnv.create_window(0, 0, anchor='nw', window=self.child) self.child.update_idletasks() #self.child.grid(row=0, column=0, sticky=NSEW) self.cnv.config(scrollregion=self.cnv.bbox("all")) self.cnv.grid(row=0, column=0, sticky='NSEW') # Edit the testbed def edit_testbed(self): self.editFrame = Frame(self.mainFrame, bd=1, background='white') #self.editFrame.grid(row=len(self.cfile.curparse.testbed_statements)+3, columnspan=2, sticky='NSEW') self.editFrame.grid(row=2, columnspan=2, sticky='NSEW') self.text = Text(self.editFrame, padx=5, wrap=None, undo = YES, background='white') vbar = Scrollbar(self.editFrame) hbar = Scrollbar(self.editFrame, orient='horizontal') self.text.config(yscrollcommand=vbar.set) # call vbar.set on text move self.text.config(xscrollcommand=hbar.set) vbar.config(command=self.text.yview) # call text.yview on scroll move hbar.config(command=self.text.xview) # or hbar['command']=text.xview # Change the text on the button, and also pass the rest # of the arguments so that the grid for the statements can be reset self.edit.config(text='Done', command= self.save_testbed) # Changing the mode of the cfile object here, # so that once the user clicks done, # the whole object is recompiled and redisplayed self.cfile.mode= 'Edit' vbar.pack(side=RIGHT, fill=Y) hbar.pack(side=BOTTOM, fill=X) self.text.pack(fill= BOTH, expand= YES) # Set a mark at the beginning of the text self.text.mark_set("START", INSERT) self.text.mark_gravity("START", LEFT) # Push in the rest of the file's contents fileData = self.cfile.getAllText() self.text.insert(INSERT, fileData) # Move the insert position to the first occurence of the family name # FIXME: this is poor implementation # The positioning of the insert cursor should be happening by parsing the # CFG production rules, using CSFamily.prod.lineno and endlineno self.text.config(takefocus=True) idx= self.text.search('testbed', "START") if idx: self.text.mark_set(CURRENT, idx) self.text.see(CURRENT) else: showwarning(title= 'VisCCG: Warning', message='No initial testbed found') #self.editFrame.pack(expand=YES, fill=BOTH) self.child.update_idletasks() self.cnv.config(scrollregion=self.cnv.bbox("all")) # Save the edited text def save_testbed(self): # We force the text contents of the cfile object to copy over # all that is presently in the current text-box self.cfile.setAllText(self.text.get(1.0,END)) self.edit.config(text='Edit', command= self.edit_testbed) self.editFrame.pack_forget() # Recompile whatever was edited and redisplay # Note: changes are not saved hereby!! 
self.cfile.compile_if_needed() self.cfile.onTestbed() # Enter a new sentence def new_sentence(self): master = Tk() master.title('VisCCG: New Sentence for the testbed') sent = Entry(master, bg='#FFFFFF', width = 100) nParses = Entry(master, bg='#FFFFFF', width = 2) sLabel = Label (master, text = 'Sentence:') nLabel = Label (master, text = 'Number of parses:') sent.focus_set() b = Button(master, text="Add sentence", width=10, command= lambda:self.editNew(master, sent, nParses)) c = Button(master, text="Cancel", command= master.destroy) sent.grid (row=1, column=0, sticky = W) nParses.grid (row=1, column=1, sticky= W) sLabel.grid (row=0, column=0, sticky=W) nLabel.grid (row=0, column=1, sticky = W) b.grid (row=2, column = 0) c.grid (row=2, column = 1) # Print from the new sentence def editNew(self, master, sent, nParses): # Prepare the file's contents for editing fileData = self.cfile.getAllText() self.text = Text(master) self.text.mark_set("START", INSERT) self.text.mark_gravity("START", LEFT) self.text.insert(INSERT, fileData) testSent = sent.get() npSent = nParses.get() self.text.config(takefocus=True) idx= self.text.search('testbed', "START") if idx: self.text.mark_set("START", idx) idx = self.text.search('{', "START", forwards = True) self.text.mark_set("START", idx) idx = self.text.search('\n', "START", forwards = True) # FIXME: really poor search for locating the right position # to insert text here. Needs correction! self.text.mark_set(INSERT, idx) self.text.mark_gravity(INSERT, RIGHT) self.text.insert (INSERT, '\n\t'+ testSent+ ':\t'+ npSent+ ';') else: showwarning(title= 'VisCCG: Warning', message='No initial testbed found, creating new') self.text.mark_set(INSERT, END) self.text.mark_gravity(INSERT, RIGHT) self.text.insert (INSERT, ' testbed {\n') self.text.insert (INSERT, '\n\t'+ testSent+ ':\t'+ npSent+ ';') self.text.insert (INSERT, '}\n') # Set the original file's data to be this fileData= self.text.get(1.0, END) self.cfile.setAllText(fileData) # Destroy the entry window master.destroy() # Update the display self.cfile.mode= 'Edit' self.cfile.compile_if_needed() self.cfile.onTestbed() # Creates the top-level window and populates the widgets below it. class CFile(object): #### NOTE NOTE NOTE! Variables declared like this, in the class itself, #### are class variables (not instance variables) until they are #### assigned to. If you want pure instance variables, you need to #### initialize them inside of __init__(). # Hash table describing modes and the associated class modelist = {'Edit':CEdit, 'Lexicon':CLexicon, 'Features':CFeatures, 'Words':CWords, 'Testbed':CTestbed, 'Rules':CRules} startfiledir = '.' 
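    # Illustrative aside (not part of the original source), expanding on the
    # NOTE above: attributes assigned at class level, such as startfiledir or
    # the colors/fonts lists below, are shared by every CFile instance until an
    # instance rebinds them.  In particular, mutating a shared list (as
    # onFontList() does with append/del on self.fonts) is visible in all open
    # windows, e.g.:
    #
    #     a, b = CFile(), CFile()
    #     a.fonts.append(('courier', 30, 'normal'))   # b.fonts sees this too
    #     a.startfiledir = '/tmp'                     # rebinds only a's attribute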
ftypes = [('All files', '*'), # for file open dialog ('Text files', '.txt'), # customize in subclass ('Python files', '.py')] # or set in each instance colors = [{'fg':'black', 'bg':'white'}, # color pick list {'fg':'yellow', 'bg':'black'}, # first item is default {'fg':'white', 'bg':'blue'}, # tailor me as desired {'fg':'black', 'bg':'beige'}, # or do PickBg/Fg chooser {'fg':'yellow', 'bg':'purple'}, {'fg':'black', 'bg':'brown'}, {'fg':'lightgreen', 'bg':'darkgreen'}, {'fg':'darkblue', 'bg':'orange'}, {'fg':'orange', 'bg':'darkblue'}] fonts = [('courier', 9+FontScale, 'normal'), # platform-neutral fonts ('courier', 12+FontScale, 'normal'), # (family, size, style) ('courier', 10+FontScale, 'bold'), # or popup a listbox ('courier', 10+FontScale, 'italic'), # make bigger on linux ('times', 10+FontScale, 'normal'), ('helvetica', 10+FontScale, 'normal'), ('ariel', 10+FontScale, 'normal'), ('system', 10+FontScale, 'normal'), ('courier', 20+FontScale, 'normal')] def __init__(self, file=None): self.file = file self.openDialog = None self.saveDialog = None self.lastfind = None self.current_parse = None self.mode = None self.last_save_signature = None self.last_compile_signature = None # First top-level window is Tk(); rest are Toplevel() global root if not root: root = Tk() self.top = root else: self.top = Toplevel(root) ccg2xml.late_init_graphics() openfiles[self] = True self.top.protocol('WM_DELETE_WINDOW', self.onClose) # We create an outer frame to hold the toolbar and the main widget. # Create all the different kinds of main widget. # FIXME: Maybe outer isn't necessary? self.outer = Frame(self.top) self.outer.pack(expand=YES, fill=BOTH) # make frame stretchable self.modes = {} for mode in self.modelist: self.modes[mode] = self.modelist[mode](self.outer, self) self.main = None self.toolbar_widget = None self.checkbar_widget = None #self.switch_to('Edit') self.setFileName(None) if file: self.onFirstOpen(file) else: # When the user has just opened a new file # Need to load template from the src folder openccg_home = os.environ['OPENCCG_HOME'] template = open(openccg_home + '/src/ccg2xml/grammar_template.ccg', 'r').read() self.setAllText(template) # Save the MD5 signature for future comparison self.last_save_signature = self.getSignature(self.getAllText()) self.switch_to('Edit') def switch_to(self, mode): # Switch to a different mode (display, edit, test). Remove the # existing main and toolbar widgets, if existing. Redo the menubar # and toolbar widgets according to the new mode and then display # the new widgets. # # FIXME: We should probably create the menubar and toolbar widgets # only once, and remember them. if self.mode != mode: if self.main: self.main.pack_forget() if self.toolbar_widget: self.toolbar_widget.pack_forget() if self.checkbar_widget: self.checkbar_widget.pack_forget() self.mode = mode self.main = self.modes[mode] self.makeMenubar() self.makeToolbar(mode) self.makeCheckbar() #print "Reinit being called now... " self.main.reinit() # Pack the main widget after the toolbar, so it goes below it. self.main.pack(side=TOP, expand=YES, fill=BOTH) # Create the menubar; assumes that self.menubar has been set to the # appropriate menubar description. Note that the menubar has to be a # child of the top-level window itself rather than any child of it, so # that it can be correctly displayed at the top of the window -- or # possibly in its decoration (Windows) or at top of screen (Mac). # # From PP2E guimaker.py. 
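    # Illustrative note (not part of the original source): the menubar
    # description consumed here is the nested list built in CTab.__init__: a
    # list of (label, underline-index, items) triples whose items are command
    # tuples of the form (label, underline-index, callback) or the string
    # 'separator'; addMenuItems() below also accepts a nested items list to
    # build a cascading submenu.  For example:
    #
    #     [('File', 0, [('Open...', 0, self.onOpen), 'separator',
    #                   ('Quit VisCCG', 0, self.onQuit)])]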
def makeMenubar(self): menubar = Menu(self.top) self.top.config(menu=menubar) for (name, key, items) in self.main.menubar: pulldown = Menu(menubar) self.addMenuItems(pulldown, items) menubar.add_cascade(label=name, underline=key, menu=pulldown) if sys.platform[:3] == 'win': menubar.add_command(label='Help', command=self.help) else: pulldown = Menu(menubar) # linux needs real pulldown pulldown.add_command(label='About', command=self.help) menubar.add_cascade(label='Help', menu=pulldown) # Add items to a menu or submenu. From PP2E guimaker.py. def addMenuItems(self, menu, items): for item in items: # scan nested items list if item == 'separator': # string: add separator menu.add_separator({}) elif type(item) is list: # list: disabled item list for num in item: menu.entryconfig(num, state=DISABLED) elif type(item[2]) is not list: menu.add_command(label = item[0], # command: underline = item[1], # add command command = item[2]) # cmd=callable else: pullover = Menu(menu) self.addMenuItems(pullover, item[2]) # sublist: menu.add_cascade(label = item[0], # make submenu underline = item[1], # add cascade menu = pullover) def makeToolbar(self, selected): """ make toolbar (of buttons) at top, if any expand=no, fill=x so same width on resize """ if self.main.toolbar: self.toolbar_widget = Frame(self.outer, cursor='hand2', relief=SUNKEN, bd=2) self.toolbar_widget.pack(side=TOP, fill=X) for (name, action, where) in self.main.toolbar: but = Button(self.toolbar_widget, text=name, command=action) if name == selected: but.config(relief=SUNKEN) but.pack(where) def makeCheckbar(self): """ make check-button bar at top, if any expand=no, fill=x so same width on resize """ if self.main.checkbar: self.checkbar_widget = Frame(self.outer, cursor='hand2', relief=SUNKEN, bd=2) self.checkbar_widget.pack(side=TOP, fill=X) for (name, var) in self.main.checkbar: Checkbutton(self.checkbar_widget, text=name, variable=var, command=self.main.redraw).pack(side=LEFT) def getAllText(self): return self.modes['Edit'].getAllText() def setAllText(self, text): self.modes['Edit'].setAllText(text) #self.modes['Display'].setAllText(text) def _getints(self, string): """Internal function.""" if string: if type(string) is str: textwid = self.modes['Edit'].text return tuple(map(getint, textwid.tk.splitlist(string))) else: return string def edit(self, *args): """Internal method This method controls the undo mechanism and the modified flag. The exact behavior of the command depends on the option argument that follows the edit argument. The following forms of the command are currently supported: edit_modified, edit_redo, edit_reset, edit_separator and edit_undo """ textwid = self.modes['Edit'].text return self._getints( textwid.tk.call((textwid._w, 'edit') + args)) or () def edit_modified(self, arg=None): """Get or Set the modified flag If arg is not specified, returns the modified flag of the widget. The insert, delete, edit undo and edit redo commands or the user can set or clear the modified flag. If boolean is specified, sets the modified flag of the widget to arg. 
""" # Added to use md5 functionality to watch for changed data if arg is None: alltext = self.getAllText() if (self.last_save_signature != self.getSignature(alltext)): return YES return self.edit("modified", arg) def onInfo(self): text = self.getAllText() # added on 5/3/00 in 15 mins bytes = len(text) # words uses a simple guess: lines = len(string.split(text, '\n')) # any separated by whitespace words = len(string.split(text)) index = self.main.text.index(INSERT) where = tuple(string.split(index, '.')) showinfo('CCG Editor Information', 'Current location:\n\n' + 'line:\t%s\ncolumn:\t%s\n\n' % where + 'File text statistics:\n\n' + 'Modified: %s\n\n' % self.edit_modified()+ 'bytes:\t%d\nlines:\t%d\nwords:\t%d\n' % (bytes, lines, words)) ####################### # Search menu commands ####################### def onGoto(self, line=None): if not line: line = askinteger('CCG Editor', 'Enter line number') self.main.text.update() self.main.text.focus() if line is not None: maxindex = self.main.text.index(END+'-1c') maxline = atoi(split(maxindex, '.')[0]) if line > 0 and line <= maxline: self.main.text.mark_set(INSERT, '%d.0' % line) # goto line self.main.text.tag_remove(SEL, '1.0', END) # delete selects self.main.text.tag_add(SEL, INSERT, 'insert + 1l') # select line self.main.text.see(INSERT) # scroll to line else: showerror('CCG Editor', 'Bad line number') def onFind(self, lastkey=None): key = lastkey or askstring('CCG Editor', 'Enter search string') self.main.text.update() self.main.text.focus() self.lastfind = key if key: where = self.main.text.search(key, INSERT, END) # don't wrap if not where: showerror('CCG Editor', 'String not found') else: pastkey = where + '+%dc' % len(key) # index past key self.main.text.tag_remove(SEL, '1.0', END) # remove any sel self.main.text.tag_add(SEL, where, pastkey) # select key self.main.text.mark_set(INSERT, pastkey) # for next find self.main.text.see(where) # scroll display def onRefind(self): self.onFind(self.lastfind) ###################### # Tools menu commands ###################### def onFontList(self): self.fonts.append(self.fonts[0]) # pick next font in list del self.fonts[0] # resizes the text area self.modes['Edit'].text.config(font=self.fonts[0]) self.modes['Display'].text.config(font=self.fonts[0]) def onColorList(self): self.colors.append(self.colors[0]) # pick next color in list del self.colors[0] # move current to end self.modes['Edit'].text.config(fg=self.colors[0]['fg'], bg=self.colors[0]['bg']) self.modes['Display'].text.config(fg=self.colors[0]['fg'], bg=self.colors[0]['bg']) def onPickFg(self): self.pickColor('fg') def onPickBg(self): self.pickColor('bg') def pickColor(self, part): (triple, hexstr) = askcolor() if hexstr: apply(self.modes['Edit'].text.config, (), {part: hexstr}) apply(self.modes['Display'].text.config, (), {part: hexstr}) # def onRunCode(self, parallelmode=1): # """ # run Python code being edited--not an ide, but handy; # tries to run in file's dir, not cwd (may be pp2e root); # inputs and adds command-line arguments for script files; # code's stdin/out/err = editor's start window, if any; # but parallelmode uses start to open a dos box for i/o; # """ # from PP2E.launchmodes import System, Start, Fork # filemode = 0 # thefile = str(self.getFileName()) # cmdargs = askstring('CCG Editor', 'Commandline arguments?') or '' # if os.path.exists(thefile): # filemode = askyesno('CCG Editor', 'Run from file?') # if not filemode: # run text string # namespace = {'__name__': '__main__'} # run as top-level # sys.argv = [thefile] + 
string.split(cmdargs) # could use threads # exec self.getAllText() + '\n' in namespace # exceptions ignored # elif askyesno('CCG Editor', 'Text saved in file?'): # mycwd = os.getcwd() # cwd may be root # os.chdir(os.path.dirname(thefile) or mycwd) # cd for filenames # thecmd = thefile + ' ' + cmdargs # if not parallelmode: # run as file # System(thecmd, thecmd)() # block editor # else: # if sys.platform[:3] == 'win': # spawn in parallel # Start(thecmd, thecmd)() # or use os.spawnv # else: # Fork(thecmd, thecmd)() # spawn in parallel # os.chdir(mycwd) ##################### # File menu commands ##################### def getSignature(self, contents): return md5.md5(contents).digest() def my_askopenfilename(self): # objects remember last result dir/file if not self.openDialog: self.openDialog = Open(initialdir=self.startfiledir, filetypes=self.ftypes) return self.openDialog.show() def my_asksaveasfilename(self): # objects remember last result dir/file if not self.saveDialog: self.saveDialog = SaveAs(initialdir=self.startfiledir, filetypes=self.ftypes) self.last_save_signature = self.getSignature(self.getAllText()) return self.saveDialog.show() def onOpen(self): file = self.my_askopenfilename() # FIXME! Only create new window if file exists and is readable if file: CFile(file) def onFirstOpen(self, file): try: text = open(file, 'r').read() except: showerror('CCG Editor', 'Could not open file ' + file) else: self.setAllText(text) self.setFileName(file) def compile_if_needed(self): # Compare the last compiled MD5 signature and present one # and compile if needed. # To force compilation, set this signature to None text = self.getAllText() textSign = self.getSignature(text) if textSign != self.last_compile_signature: # Now compile ccg2xml.init_global_state(errors_to_string=True) ccg2xml.options.quiet = True self.curparse = ccg2xml.parse_string(text) self.last_compiled_signature = textSign def onDisplay(self): self.switch_to('Display') def onEdit(self): self.switch_to('Edit') def onLexicon(self): self.switch_to('Lexicon') def onTestbed(self): self.switch_to('Testbed') def onRules(self): self.switch_to('Rules') def onWords(self): self.switch_to('Words') def onFeatures(self): self.switch_to('Features') def onNew(self): CFile() def getFileName(self): return self.currfile def setFileName(self, name): self.currfile = name # for save if name: title = 'VisCCG Editor: %s' % name else: title = 'VisCCG Editor' self.top.title(title) self.top.iconname(title) def help(self): showinfo('Help', 'Sorry, no help for ' + self.__class__.__name__) # Close this window; if this is the last window, quit def onClose(self): assert self in openfiles if len(openfiles) == 1 or self.top == root: self.onQuit() # If we got this far, the user refused to quit, so do nothing else: ccg2xml.debug("fooooo\n") del openfiles[self] self.top.destroy() def onQuit(self): modfiles = False for f in openfiles: if f.edit_modified() == YES: modfiles = True break if not modfiles or askyesno('CCG Editor', 'Files are modified, Really quit?'): self.top.quit() def main(): ccg2xml.parse_arguments(sys.argv[1:]) ccg2xml.init_global_state_once() if ccg2xml.global_args and len(ccg2xml.global_args) > 0: # file name: fname = ccg2xml.global_args[0] else: fname = None CFile(fname) mainloop() if __name__ == '__main__': # when run as a script main() ================================================ FILE: src/ccg2xml/convert-ply.py ================================================ #!/usr/bin/python import sys import re import optparse import os.path import time # 
Author: Ben Wing # Date: April 2006 ############################################################################# # # # convert-ply.py # # # # Convert a .ply file into a .py file which can be run to generate a # # compiler for a language and use it to parse a specified file. This # # program is something like a compiler-compiler-compiler -- it uses a # # script to generate a compiler-compiler script, which in turn is used # # to generate a compiler, which in turn processes a program in some # # arbitrary syntax and does whatever it wants with it. Very meta!!! # # # ############################################################################# # The format of a .ply file is that of a .py file with YACC-like directives # interspersed. %y on a line by itself switches to YACC mode, and %p # switches back to Python mode. In YACC mode, lines should look like this: # lhs: rhs1 rhs2 ...: python code # first alternative # : rhs3 rhs4 ...: more python code # second alternative # : rhs5 rhs6 # alternative with default code of $$ = $1 # : rhs7 rhs8 ...: # # If no code follows the colon on the same line, the code consists # # of all following indented lines. # python code # python code # ... # # This represents a context-free rule where LHS expands to one or more # rules (e.g. RHS1 RHS2 ... or RHS3 RHS4 ... or RHS5 RHS6 ... etc.). # Associated with each rule is some code, which will be invoked when the # parser finds an appropriately matching right-hand side somewhere in # the stream of tokens being parsed and proceeds to "reduce" the relevant # tokens into the single left-hand side token LHS. Associated with each # token is a value. For terminal tokens, the value is the string in the # text that produced this token. For non-terminal tokens, the value is # determined by the code associated with the rule that produced this token # (i.e. one of the rules with this token as its LHS). The value of a # non-terminal token is set by assigning to $$; values of RHS tokens are # referenced using $1, $2, etc., where $1 is the first RHS token, $2 # is the second, etc. Hence, the default code of $$ = $1 assigns the # value of the first RHS token to the LHS token. The code can also # reference $@, which is a structure encapsulating all RHS values; this # is mostly useful for getting at $@.lineno, a function referring to the # starting line number of a particular token (especially $@.lineno(0), the # starting line number of the set of RHS tokens). # WARNING!!! Currently, PLY has a serious bug in its handling of empty # RHS rules; often it reports a syntax error in place of properly reducing # an empty RHS rule. If this happens, you must rewrite the appropriate # rules without the use of an empty RHS rule. (As of yet, I'm not sure # exactly what the circumstances are that trigger this bug.) # # Note that this bug exists as of PLY 1.6, which is what we are currently # using. It's quite possible that later versions of PLY (especially the # new PLY 2.x series) fix the bug. ########################################################################### # # Command-line options and usage # ########################################################################### usage = """%prog [OPTIONS] FILE ... Convert from .ply format to a .py file, for lex/yacc. """ parser = optparse.OptionParser(usage=usage) parser.add_option("-o", "--outfile", default=None, help="""Specify the output file. 
Default is y.INFILE.py, where INFILE is the source file's name minus any .ply extension.""", metavar="FILE") (options, args) = parser.parse_args() def syntax_error(err, line): global errors errors += 1 if errors > maxerr: raise SyntaxError("Too many errors (more than %s) when compiling" % maxerr) sys.stderr.write("%s in file %s, line %d: %s\n" % (err, current_file, current_lineno, line)) wordrange = r'\-a-zA-Z0-9_%' operrange = r'\+\*\|\?' wordre = '[%s]+' % wordrange def make_name_python_safe(name): return re.sub('[^A-Za-z0-9_]', '_', name) # Replace dollar signs in CODE to point to the actual array of RHS values. # If RENUMBER_AT is given, however, convert $RENUMBER_AT to None, and # subtract one from all $ references above this value. def replace_dollar_signs(code, renumber_at=None): newcode = "" prevright = 0 for match in re.finditer(r"""('''([^\\\n]|\\(.|\n))*?'''| \"\"\"([^\\\n]|\\(.|\n))*?\"\"\"| '([^\\\n]|\\(.|\n))*?'| \"([^\\\n]|\\(.|\n))*?\"| [#][^\n]*\n?| ([^\\'\"#]|\\(.|\n))*)""", code, re.VERBOSE): errored = 0 if prevright != match.start(0): syntax_error("Apparent syntax error in code at position %d" % prevright, code) errored = 1 newcode += code[prevright:match.start(0)] prevright = match.end(0) matchstr = match.group(0) if not matchstr: if match.start(0) == len(code): break elif not errored: errored = 1 syntax_error("Apparent syntax error in code at position %d" % match.start(0), code) elif matchstr[0] in '\'"#': # A comment or literal; don't substitute in it pass elif renumber_at: # Renumber def replace_dollar_def(match): str = match.group() ref = int(str[1:]) if ref == renumber_at: return '[]' elif ref > renumber_at: return '$%d' % (ref - 1) else: return str matchstr = re.sub(r'\$([0-9]+)', replace_dollar_def, matchstr) else: # Apply substitutions matchstr = re.sub(r'\$@', 'p', matchstr) matchstr = re.sub(r'\$\$', 'p[0]', matchstr) matchstr = re.sub(r'\$([0-9]+)', r'p[\1]', matchstr) newcode += matchstr return newcode # Output a single CFG rule def output_python_cfg_rule(fil, lhs, rhs, code): global unique_no # Look for occurrences of foo* or foo+; handle all of them by # adding appropriate list rules. newrhs = "" prevright = 0 for match in re.finditer(r'(%s)\s*([+*])' % wordre, rhs): matchstr = match.group(1) newrhs += rhs[prevright:match.start(0)] prevright = match.end(0) unique_no += 1 matchlhs = '%s_%s_list_%s' % (lhs, matchstr, unique_no) newrhs += matchlhs if match.group(2) == '+': output_python_cfg_rule(fil, matchlhs, matchstr, " $$ = [$1]\n") else: output_python_cfg_rule(fil, matchlhs, " ", " $$ = []\n") output_python_cfg_rule(fil, matchlhs, '%s %s' % (matchlhs, matchstr), " $$ = $1 + [$2]\n") if prevright: newrhs += rhs[prevright:] rhs = newrhs # Look for occurrences of foo?; handle by splitting into two rules # (It should be possible to handle by using empty rules, but this # is currently broken in PLY and more-or-less randomly doesn't work, # with the empty rule not being recognized and a syntax error # resulting) match = re.search(r'(%s)\s*[?]' % wordre, rhs) if match: matchtoken = match.group(1) # matched token, w/o following '?' leftrhs = rhs[0:match.start(0)] # text before match rightrhs = rhs[match.end(0):] # text after match # Output the "it's there" alternative output_python_cfg_rule(fil, lhs, leftrhs + matchtoken + rightrhs, code) # compute token ID, as would be referenced by a $# reference, based # on the text before the match. first delete everything before a # '|' (alternatives) then count the number of words. 
tokennum = len(re.sub('.*\|', '', leftrhs).split()) + 1 code = replace_dollar_signs(code, tokennum) # Output the "it's not there" alternative, with the dollar references # renumbered. We should *not* attempt any tail-recursion elimination # here, in case there are further foo? occurrences later in the file. output_python_cfg_rule(fil, lhs, leftrhs + rightrhs, code) else: unique_no += 1 print >> fil, "def p_%s_%d(p):" % (make_name_python_safe(lhs), unique_no) rhs = rhs.strip() rhs = re.sub(r'\s*\|\s*', r'\n | ', rhs) rhs = re.sub(r'\n\s*\n', '\n', rhs) if rhs.find('\n') >= 0: print >> fil, " '''%s : %s'''" % (lhs, rhs) else: print >> fil, " '%s : %s'" % (lhs, rhs) code = replace_dollar_signs(code) print >> fil, code def output_default_python_cfg_rule(fil, lhs, rhs): output_python_cfg_rule(fil, lhs, rhs, " $$ = $1\n") def finish_any_cfg(fil): global curlhs, currhs, yacc_python_mode, yacc_python_code if currhs: # A RHS not yet finished; finish it if yacc_python_code: output_python_cfg_rule(fil, curlhs, currhs, yacc_python_code) else: output_default_python_cfg_rule(fil, curlhs, currhs) clear_rule_context() def clear_rule_context(): global curlhs, currhs, yacc_python_mode, yacc_python_code curlhs = None currhs = None yacc_python_mode = False yacc_python_code = None ## Process file(s) args = args or ['-'] for arg in args: global current_file current_file = arg # Open input and output files if arg == '-': fil = sys.stdin else: fil = open(arg) if options.outfile: outarg = options.outfile else: if arg == '-': outarg = 'y.ccg.py' else: fname = arg if fname.endswith('.ply'): fname = fname[0:-4] (fdir, ffile) = os.path.split(fname) outarg = os.path.join(fdir, 'y.%s.py' % ffile) outfil = open(outarg, 'w') # Initialize state errors = 0 maxerr = 5 unique_no = 0 clear_rule_context() mode = 'python' contline = None print >> outfil, """#!/usr/bin/python ################## NOTE NOTE NOTE ################## # # This file (%s) was automatically generated from %s. # Generated by %s at %s. # # DO NOT MODIFY THIS FILE DIRECTLY. YOUR CHANGES WILL BE LOST. # Instead, modify the file `%s' that generated this file, and then # rerun `%s%s %s'. 
# ################## NOTE NOTE NOTE ################## """ % (outarg, current_file, sys.argv[0], time.asctime(), current_file, sys.argv[0], options.outfile and " -o %s" % options.outfile or "", current_file) global current_lineno current_lineno = 0 for line in fil: current_lineno += 1 line = line.rstrip("\r\n") if contline: line = contline + line contline = None if line == '%y': mode = 'yacc' elif line == '%p': mode = 'python' finish_any_cfg(outfil) elif line == '%l': mode = 'lex' else: if mode == 'python': print >> outfil, line else: if yacc_python_mode: if re.match(r'\S', line): yacc_python_mode = False else: yacc_python_code += line + '\n' continue if re.match(r'\s*#.*$', line): print >> outfil, line continue elif line and line[-1] == '\\': contline = line[0:-1] continue elif re.match(r'\s*$', line): print >> outfil, line continue # Eliminate comments, but conservatively, to avoid any # possibility of removing comments inside of quotes (which # should occur only in Python code, anyway, in which case # it doesn't really matter) line = re.sub(r'''^([^\'\"#]*)#.*$''', '\1', line) if mode == 'yacc': match = re.match(r'(%s)\s*(:.*)$' % wordre, line) if match: # We are starting a new rule finish_any_cfg(outfil) curlhs = match.group(1) line = ' ' + match.group(2) match = re.match(r'(\s*)(:)?([^:]*)(:.*)?$', line) if not match or not match.group(1): syntax_error("Unrecognized rule beginning", line) if re.match(r'^.*[^%s\s%s].*$' % (operrange, wordrange), match.group(3)): syntax_error("Illegal characters in RHS", line) if not match.group(2): # We are continuing an RHS if currhs == None: syntax_error("Invalid RHS continuation", line) else: currhs += match.expand(r' \3') else: # We are starting an RHS if curlhs == None: syntax_error("Invalid RHS without LHS", line) else: if currhs: output_default_python_cfg_rule(outfil, curlhs, currhs) currhs = match.group(3) if match.group(4): # strip colon, spaces code = match.group(4)[1:].strip() if not code: # Start eating the rest of the code until new rule yacc_python_mode = True yacc_python_code = "" else: code = ' ' + code + '\n' output_python_cfg_rule(outfil, curlhs, currhs, code) currhs = None finish_any_cfg(outfil) fil.close() outfil.close() ================================================ FILE: src/ccg2xml/grammar_template.ccg ================================================ ############ [name of the grammar] #################### # ## [a brief description of your grammar] ## [your name, Month Year] # # # For help on how to create grammars with VisCCG, see the tutorial: # http://comp.ling.utexas.edu/wiki/doku.php/openccg/ccggui_tut ####################### Features ####################### feature { } ######################### Words ######################### ######################### Rules ######################### ################## Lexicon/Categories #################### ####################### Testbed ######################### testbed { } ================================================ FILE: src/ccg2xml/lex.py ================================================ #----------------------------------------------------------------------------- # ply: lex.py # # Author: David M. Beazley (dave@dabeaz.com) # # Copyright (C) 2001-2005, David M. 
Beazley # # $Header: /cvsroot/openccg/openccg/src/ccg2xml/lex.py,v 1.1 2006/09/30 08:11:29 benwing Exp $ # # This library is free software; you can redistribute it and/or # modify it under the terms of the GNU Lesser General Public # License as published by the Free Software Foundation; either # version 2.1 of the License, or (at your option) any later version. # # This library is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU # Lesser General Public License for more details. # # You should have received a copy of the GNU Lesser General Public # License along with this library; if not, write to the Free Software # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA # # See the file COPYING for a complete copy of the LGPL. # # # This module automatically constructs a lexical analysis module from regular # expression rules defined in a user-defined module. The idea is essentially the same # as that used in John Aycock's Spark framework, but the implementation works # at the module level rather than requiring the use of classes. # # This module tries to provide an interface that is closely modeled after # the traditional lex interface in Unix. It also differs from Spark # in that: # # - It provides more extensive error checking and reporting if # the user supplies a set of regular expressions that can't # be compiled or if there is any other kind of a problem in # the specification. # # - The interface is geared towards LALR(1) and LR(1) parser # generators. That is tokens are generated one at a time # rather than being generated in advanced all in one step. # # There are a few limitations of this module # # - The module interface makes it somewhat awkward to support more # than one lexer at a time. Although somewhat inelegant from a # design perspective, this is rarely a practical concern for # most compiler projects. # # - The lexer requires that the entire input text be read into # a string before scanning. I suppose that most machines have # enough memory to make this a minor issues, but it makes # the lexer somewhat difficult to use in interactive sessions # or with streaming data. # #----------------------------------------------------------------------------- r""" lex.py This module builds lex-like scanners based on regular expression rules. To use the module, simply write a collection of regular expression rules and actions like this: # lexer.py import lex # Define a list of valid tokens tokens = ( 'IDENTIFIER', 'NUMBER', 'PLUS', 'MINUS' ) # Define tokens as functions def t_IDENTIFIER(t): r' ([a-zA-Z_](\w|_)* ' return t def t_NUMBER(t): r' \d+ ' return t # Some simple tokens with no actions t_PLUS = r'\+' t_MINUS = r'-' # Initialize the lexer lex.lex() The tokens list is required and contains a complete list of all valid token types that the lexer is allowed to produce. Token types are restricted to be valid identifiers. This means that 'MINUS' is a valid token type whereas '-' is not. Rules are defined by writing a function with a name of the form t_rulename. Each rule must accept a single argument which is a token object generated by the lexer. This token has the following attributes: t.type = type string of the token. This is initially set to the name of the rule without the leading t_ t.value = The value of the lexeme. 
t.lineno = The value of the line number where the token was encountered For example, the t_NUMBER() rule above might be called with the following: t.type = 'NUMBER' t.value = '42' t.lineno = 3 Each rule returns the token object it would like to supply to the parser. In most cases, the token t is returned with few, if any modifications. To discard a token for things like whitespace or comments, simply return nothing. For instance: def t_whitespace(t): r' \s+ ' pass For faster lexing, you can also define this in terms of the ignore set like this: t_ignore = ' \t' The characters in this string are ignored by the lexer. Use of this feature can speed up parsing significantly since scanning will immediately proceed to the next token. lex requires that the token returned by each rule has an attribute t.type. Other than this, rules are free to return any kind of token object that they wish and may construct a new type of token object from the attributes of t (provided the new object has the required type attribute). If illegal characters are encountered, the scanner executes the function t_error(t) where t is a token representing the rest of the string that hasn't been matched. If this function isn't defined, a LexError exception is raised. The .text attribute of this exception object contains the part of the string that wasn't matched. The t.skip(n) method can be used to skip ahead n characters in the input stream. This is usually only used in the error handling rule. For instance, the following rule would print an error message and continue: def t_error(t): print "Illegal character in input %s" % t.value[0] t.skip(1) Of course, a nice scanner might wish to skip more than one character if the input looks very corrupted. The lex module defines a t.lineno attribute on each token that can be used to track the current line number in the input. The value of this variable is not modified by lex so it is up to your lexer module to correctly update its value depending on the lexical properties of the input language. To do this, you might write rules such as the following: def t_newline(t): r' \n+ ' t.lineno += t.value.count("\n") To initialize your lexer so that it can be used, simply call the lex.lex() function in your rule file. If there are any errors in your specification, warning messages or an exception will be generated to alert you to the problem. (dave: this needs to be rewritten) To use the newly constructed lexer from another module, simply do this: import lex import lexer plex.input("position = initial + rate*60") while 1: token = plex.token() # Get a token if not token: break # No more tokens ... do whatever ... Assuming that the module 'lexer' has initialized plex as shown above, parsing modules can safely import 'plex' without having to import the rule file or any additional imformation about the scanner you have defined. 
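For reference, the pieces described above can be combined into a single,
self-contained rule file along the following lines (a minimal sketch only;
the token names, patterns, and sample input are invented for illustration
and follow the Python 2 idiom used throughout this file):

    # calclex.py: illustrative sketch of a complete lex specification
    import lex

    tokens = ('NUMBER', 'PLUS', 'MINUS')

    # Simple tokens defined as strings
    t_PLUS  = r'\+'
    t_MINUS = r'-'

    # Characters skipped without producing tokens
    t_ignore = ' \t'

    # Tokens defined as functions; the docstring holds the regular expression
    def t_NUMBER(t):
        r'\d+'
        return t

    # Track line numbers; returning nothing discards the token
    def t_newline(t):
        r'\n+'
        t.lineno += t.value.count("\n")

    def t_error(t):
        print "Illegal character '%s'" % t.value[0]
        t.skip(1)

    # Build the lexer and run it over a sample string
    lexer = lex.lex()
    lexer.input("1 + 2 - 3")
    while 1:
        tok = lexer.token()
        if not tok: break
        print tok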
""" # ----------------------------------------------------------------------------- __version__ = "1.6" import re, types, sys, copy # Exception thrown when invalid token encountered and no default class LexError(Exception): def __init__(self,message,s): self.args = (message,) self.text = s # Token class class LexToken: def __str__(self): return "LexToken(%s,%r,%d)" % (self.type,self.value,self.lineno) def __repr__(self): return str(self) def skip(self,n): try: self._skipn += n except AttributeError: self._skipn = n # ----------------------------------------------------------------------------- # Lexer class # # input() - Store a new string in the lexer # token() - Get the next token # ----------------------------------------------------------------------------- class Lexer: def __init__(self): self.lexre = None # Master regular expression self.lexdata = None # Actual input data (as a string) self.lexpos = 0 # Current position in input text self.lexlen = 0 # Length of the input text self.lexindexfunc = [ ] # Reverse mapping of groups to functions and types self.lexerrorf = None # Error rule (if any) self.lextokens = None # List of valid tokens self.lexignore = None # Ignored characters self.lineno = 1 # Current line number self.debug = 0 # Debugging mode self.optimize = 0 # Optimized mode self.token = self.errtoken def __copy__(self): c = Lexer() c.lexre = self.lexre c.lexdata = self.lexdata c.lexpos = self.lexpos c.lexlen = self.lexlen c.lexindexfunc = self.lexindexfunc c.lexerrorf = self.lexerrorf c.lextokens = self.lextokens c.lexignore = self.lexignore c.debug = self.debug c.lineno = self.lineno c.optimize = self.optimize c.token = c.realtoken return c # ------------------------------------------------------------ # input() - Push a new string into the lexer # ------------------------------------------------------------ def input(self,s): if not isinstance(s, (unicode, types.StringType)): raise ValueError, "Expected a string" self.lexdata = s self.lexpos = 0 self.lexlen = len(s) self.token = self.realtoken # Change the token routine to point to realtoken() global token if token == self.errtoken: token = self.token # ------------------------------------------------------------ # errtoken() - Return error if token is called with no data # ------------------------------------------------------------ def errtoken(self): raise RuntimeError, "No input string given with input()" # ------------------------------------------------------------ # token() - Return the next token from the Lexer # # Note: This function has been carefully implemented to be as fast # as possible. 
Don't make changes unless you really know what # you are doing # ------------------------------------------------------------ def realtoken(self): # Make local copies of frequently referenced attributes lexpos = self.lexpos lexlen = self.lexlen lexignore = self.lexignore lexdata = self.lexdata while lexpos < lexlen: # This code provides some short-circuit code for whitespace, tabs, and other ignored characters if lexdata[lexpos] in lexignore: lexpos += 1 continue # Look for a regular expression match m = self.lexre.match(lexdata,lexpos) if m: i = m.lastindex lexpos = m.end() tok = LexToken() tok.value = m.group() tok.lineno = self.lineno tok.lexer = self func,tok.type = self.lexindexfunc[i] if not func: self.lexpos = lexpos return tok # If token is processed by a function, call it self.lexpos = lexpos newtok = func(tok) self.lineno = tok.lineno # Update line number # Every function must return a token, if nothing, we just move to next token if not newtok: continue # Verify type of the token. If not in the token map, raise an error if not self.optimize: if not self.lextokens.has_key(newtok.type): raise LexError, ("%s:%d: Rule '%s' returned an unknown token type '%s'" % ( func.func_code.co_filename, func.func_code.co_firstlineno, func.__name__, newtok.type),lexdata[lexpos:]) return newtok # No match. Call t_error() if defined. if self.lexerrorf: tok = LexToken() tok.value = self.lexdata[lexpos:] tok.lineno = self.lineno tok.type = "error" tok.lexer = self oldpos = lexpos newtok = self.lexerrorf(tok) lexpos += getattr(tok,"_skipn",0) if oldpos == lexpos: # Error method didn't change text position at all. This is an error. self.lexpos = lexpos raise LexError, ("Scanning error. Illegal character '%s'" % (lexdata[lexpos]), lexdata[lexpos:]) if not newtok: continue self.lexpos = lexpos return newtok self.lexpos = lexpos raise LexError, ("No match found", lexdata[lexpos:]) # No more input data self.lexpos = lexpos + 1 return None # ----------------------------------------------------------------------------- # validate_file() # # This checks to see if there are duplicated t_rulename() functions or strings # in the parser input file. This is done using a simple regular expression # match on each line in the filename. # ----------------------------------------------------------------------------- def validate_file(filename): import os.path base,ext = os.path.splitext(filename) if ext != '.py': return 1 # No idea what the file is. Return OK try: f = open(filename) lines = f.readlines() f.close() except IOError: return 1 # Oh well fre = re.compile(r'\s*def\s+(t_[a-zA-Z_0-9]*)\(') sre = re.compile(r'\s*(t_[a-zA-Z_0-9]*)\s*=') counthash = { } linen = 1 noerror = 1 for l in lines: m = fre.match(l) if not m: m = sre.match(l) if m: name = m.group(1) prev = counthash.get(name) if not prev: counthash[name] = linen else: print "%s:%d: Rule %s redefined. Previously defined on line %d" % (filename,linen,name,prev) noerror = 0 linen += 1 return noerror # ----------------------------------------------------------------------------- # _read_lextab(module) # # Reads lexer table from a lextab file instead of using introspection. 
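#
# Usage note (illustrative, not part of the original comments): a rule file that calls
# lex.lex(optimize=1) builds its tables normally on the first run and writes them out
# to lextab.py (the default value of the lextab argument); on subsequent runs the
# import performed here succeeds and the precomputed master regular expression and
# index table are reused, with fdict mapping rule-function names back to the live
# functions in the calling module.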
# ----------------------------------------------------------------------------- def _read_lextab(lexer, fdict, module): exec "import %s as lextab" % module lexer.lexre = re.compile(lextab._lexre, re.VERBOSE) lexer.lexindexfunc = lextab._lextab for i in range(len(lextab._lextab)): t = lexer.lexindexfunc[i] if t: if t[0]: lexer.lexindexfunc[i] = (fdict[t[0]],t[1]) lexer.lextokens = lextab._lextokens lexer.lexignore = lextab._lexignore if lextab._lexerrorf: lexer.lexerrorf = fdict[lextab._lexerrorf] # ----------------------------------------------------------------------------- # lex(module) # # Build all of the regular expression rules from definitions in the supplied module # ----------------------------------------------------------------------------- def lex(module=None,debug=0,optimize=0,lextab="lextab"): ldict = None regex = "" error = 0 files = { } lexer = Lexer() lexer.debug = debug lexer.optimize = optimize global token,input if module: # User supplied a module object. if isinstance(module, types.ModuleType): ldict = module.__dict__ elif isinstance(module, types.InstanceType): _items = [(k,getattr(module,k)) for k in dir(module)] ldict = { } for (i,v) in _items: ldict[i] = v else: raise ValueError,"Expected a module or instance" else: # No module given. We might be able to get information from the caller. try: raise RuntimeError except RuntimeError: e,b,t = sys.exc_info() f = t.tb_frame f = f.f_back # Walk out to our calling function ldict = f.f_globals # Grab its globals dictionary if optimize and lextab: try: _read_lextab(lexer,ldict, lextab) if not lexer.lexignore: lexer.lexignore = "" token = lexer.token input = lexer.input return lexer except ImportError: pass # Get the tokens map if (module and isinstance(module,types.InstanceType)): tokens = getattr(module,"tokens",None) else: try: tokens = ldict["tokens"] except KeyError: tokens = None if not tokens: raise SyntaxError,"lex: module does not define 'tokens'" if not (isinstance(tokens,types.ListType) or isinstance(tokens,types.TupleType)): raise SyntaxError,"lex: tokens must be a list or tuple." # Build a dictionary of valid token names lexer.lextokens = { } if not optimize: # Utility function for verifying tokens def is_identifier(s): for c in s: if not (c.isalnum() or c == '_'): return 0 return 1 for n in tokens: if not is_identifier(n): print "lex: Bad token name '%s'" % n error = 1 if lexer.lextokens.has_key(n): print "lex: Warning. Token '%s' multiply defined." % n lexer.lextokens[n] = None else: for n in tokens: lexer.lextokens[n] = None if debug: print "lex: tokens = '%s'" % lexer.lextokens.keys() # Get a list of symbols with the t_ prefix tsymbols = [f for f in ldict.keys() if f[:2] == 't_'] # Now build up a list of functions and a list of strings fsymbols = [ ] ssymbols = [ ] for f in tsymbols: if callable(ldict[f]): fsymbols.append(ldict[f]) elif isinstance(ldict[f], types.StringType): ssymbols.append((f,ldict[f])) else: print "lex: %s not defined as a function or string" % f error = 1 # Sort the functions by line number fsymbols.sort(lambda x,y: cmp(x.func_code.co_firstlineno,y.func_code.co_firstlineno)) # Sort the strings by regular expression length ssymbols.sort(lambda x,y: (len(x[1]) < len(y[1])) - (len(x[1]) > len(y[1]))) # Check for non-empty symbols if len(fsymbols) == 0 and len(ssymbols) == 0: raise SyntaxError,"lex: no rules of the form t_rulename are defined." 
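    # Illustrative note: the loop below assembles one master regular expression in
    # which every rule becomes a named group, e.g. roughly
    #     (?P<t_NUMBER>\d+)|(?P<t_PLUS>\+)
    # Function rules are added first, in order of their definition line numbers;
    # string rules follow, longest pattern first, so that longer literals are preferred.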
# Add all of the rules defined with actions first for f in fsymbols: line = f.func_code.co_firstlineno file = f.func_code.co_filename files[file] = None ismethod = isinstance(f, types.MethodType) if not optimize: nargs = f.func_code.co_argcount if ismethod: reqargs = 2 else: reqargs = 1 if nargs > reqargs: print "%s:%d: Rule '%s' has too many arguments." % (file,line,f.__name__) error = 1 continue if nargs < reqargs: print "%s:%d: Rule '%s' requires an argument." % (file,line,f.__name__) error = 1 continue if f.__name__ == 't_ignore': print "%s:%d: Rule '%s' must be defined as a string." % (file,line,f.__name__) error = 1 continue if f.__name__ == 't_error': lexer.lexerrorf = f continue if f.__doc__: if not optimize: try: c = re.compile(f.__doc__, re.VERBOSE) except re.error,e: print "%s:%d: Invalid regular expression for rule '%s'. %s" % (file,line,f.__name__,e) error = 1 continue if debug: print "lex: Adding rule %s -> '%s'" % (f.__name__,f.__doc__) # Okay. The regular expression seemed okay. Let's append it to the master regular # expression we're building if (regex): regex += "|" regex += "(?P<%s>%s)" % (f.__name__,f.__doc__) else: print "%s:%d: No regular expression defined for rule '%s'" % (file,line,f.__name__) # Now add all of the simple rules for name,r in ssymbols: if name == 't_ignore': lexer.lexignore = r continue if not optimize: if name == 't_error': raise SyntaxError,"lex: Rule 't_error' must be defined as a function" error = 1 continue if not lexer.lextokens.has_key(name[2:]): print "lex: Rule '%s' defined for an unspecified token %s." % (name,name[2:]) error = 1 continue try: c = re.compile(r,re.VERBOSE) except re.error,e: print "lex: Invalid regular expression for rule '%s'. %s" % (name,e) error = 1 continue if debug: print "lex: Adding rule %s -> '%s'" % (name,r) if regex: regex += "|" regex += "(?P<%s>%s)" % (name,r) if not optimize: for f in files.keys(): if not validate_file(f): error = 1 try: if debug: print "lex: regex = '%s'" % regex lexer.lexre = re.compile(regex, re.VERBOSE) # Build the index to function map for the matching engine lexer.lexindexfunc = [ None ] * (max(lexer.lexre.groupindex.values())+1) for f,i in lexer.lexre.groupindex.items(): handle = ldict[f] if type(handle) in (types.FunctionType, types.MethodType): lexer.lexindexfunc[i] = (handle,handle.__name__[2:]) else: # If rule was specified as a string, we build an anonymous # callback function to carry out the action lexer.lexindexfunc[i] = (None,f[2:]) # If a lextab was specified, we create a file containing the precomputed # regular expression and index table if lextab and optimize: lt = open(lextab+".py","w") lt.write("# %s.py. This file automatically created by PLY. Don't edit.\n" % lextab) lt.write("_lexre = %s\n" % repr(regex)) lt.write("_lextab = [\n"); for i in range(0,len(lexer.lexindexfunc)): t = lexer.lexindexfunc[i] if t: if t[0]: lt.write(" ('%s',%s),\n"% (t[0].__name__, repr(t[1]))) else: lt.write(" (None,%s),\n" % repr(t[1])) else: lt.write(" None,\n") lt.write("]\n"); lt.write("_lextokens = %s\n" % repr(lexer.lextokens)) lt.write("_lexignore = %s\n" % repr(lexer.lexignore)) if (lexer.lexerrorf): lt.write("_lexerrorf = %s\n" % repr(lexer.lexerrorf.__name__)) else: lt.write("_lexerrorf = None\n") lt.close() except re.error,e: print "lex: Fatal error. Unable to compile regular expression rules. %s" % e error = 1 if error: raise SyntaxError,"lex: Unable to build lexer." if not lexer.lexerrorf: print "lex: Warning. no t_error rule is defined." 
if not lexer.lexignore: lexer.lexignore = "" # Create global versions of the token() and input() functions token = lexer.token input = lexer.input return lexer # ----------------------------------------------------------------------------- # run() # # This runs the lexer as a main program # ----------------------------------------------------------------------------- def runmain(lexer=None,data=None): if not data: try: filename = sys.argv[1] f = open(filename) data = f.read() f.close() except IndexError: print "Reading from standard input (type EOF to end):" data = sys.stdin.read() if lexer: _input = lexer.input else: _input = input _input(data) if lexer: _token = lexer.token else: _token = token while 1: tok = _token() if not tok: break print "(%s,'%s',%d)" % (tok.type, tok.value, tok.lineno) ================================================ FILE: src/ccg2xml/yacc.py ================================================ #----------------------------------------------------------------------------- # ply: yacc.py # # Author(s): David M. Beazley (dave@dabeaz.com) # # Copyright (C) 2001-2005, David M. Beazley # # $Header: /cvsroot/openccg/openccg/src/ccg2xml/yacc.py,v 1.1 2006/09/30 08:11:29 benwing Exp $ # # This library is free software; you can redistribute it and/or # modify it under the terms of the GNU Lesser General Public # License as published by the Free Software Foundation; either # version 2.1 of the License, or (at your option) any later version. # # This library is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU # Lesser General Public License for more details. # # You should have received a copy of the GNU Lesser General Public # License along with this library; if not, write to the Free Software # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA # # See the file COPYING for a complete copy of the LGPL. # # # This implements an LR parser that is constructed from grammar rules defined # as Python functions. Roughly speaking, this module is a cross between # John Aycock's Spark system and the GNU bison utility. # # The current implementation is only somewhat object-oriented. The # LR parser itself is defined in terms of an object (which allows multiple # parsers to co-exist). However, most of the variables used during table # construction are defined in terms of global variables. Users shouldn't # notice unless they are trying to define multiple parsers at the same # time using threads (in which case they should have their head examined). # # This implementation supports both SLR and LALR(1) parsing. LALR(1) # support was implemented by Elias Ioup (ezioup@alumni.uchicago.edu) # and hacked abit by Dave to run faster. # # :::::::: WARNING ::::::: # # Construction of LR parsing tables is fairly complicated and expensive. # To make this module run fast, a *LOT* of work has been put into # optimization---often at the expensive of readability and what might # consider to be good Python "coding style." Modify the code at your # own risk! # ---------------------------------------------------------------------------- __version__ = "1.6" #----------------------------------------------------------------------------- # === User configurable parameters === # # Change these to modify the default behavior of yacc (if you wish) #----------------------------------------------------------------------------- yaccdebug = 1 # Debugging mode. 
If set, yacc generates a # a 'parser.out' file in the current directory debug_file = 'parser.out' # Default name of the debugging file tab_module = 'parsetab' # Default name of the table module default_lr = 'SLR' # Default LR table generation method error_count = 3 # Number of symbols that must be shifted to leave recovery mode import re, types, sys, cStringIO, md5, os.path # Exception raised for yacc-related errors class YaccError(Exception): pass #----------------------------------------------------------------------------- # === LR Parsing Engine === # # The following classes are used for the LR parser itself. These are not # used during table construction and are independent of the actual LR # table generation algorithm #----------------------------------------------------------------------------- # This class is used to hold non-terminal grammar symbols during parsing. # It normally has the following attributes set: # .type = Grammar symbol type # .value = Symbol value # .lineno = Starting line number # .endlineno = Ending line number (optional, set automatically) class YaccSymbol: def __str__(self): return self.type def __repr__(self): return str(self) # This class is a wrapper around the objects actually passed to each # grammar rule. Index lookup and assignment actually assign the # .value attribute of the underlying YaccSymbol object. # The lineno() method returns the line number of a given # item (or 0 if not defined). The linespan() method returns # a tuple of (startline,endline) representing the range of lines # for a symbol. class YaccProduction: def __init__(self,s): self.slice = s self.pbstack = [] def __getitem__(self,n): return self.slice[n].value def __setitem__(self,n,v): self.slice[n].value = v def __len__(self): return len(self.slice) def lineno(self,n): return getattr(self.slice[n],"lineno",0) def linespan(self,n): startline = getattr(self.slice[n],"lineno",0) endline = getattr(self.slice[n],"endlineno",startline) return startline,endline def pushback(self,n): if n <= 0: raise ValueError, "Expected a positive value" if n > (len(self.slice)-1): raise ValueError, "Can't push %d tokens. Only %d are available." % (n,len(self.slice)-1) for i in range(0,n): self.pbstack.append(self.slice[-i-1]) # The LR Parsing engine. This is defined as a class so that multiple parsers # can exist in the same process. A user never instantiates this directly. # Instead, the global yacc() function should be used to create a suitable Parser # object. class Parser: def __init__(self,magic=None): # This is a hack to keep users from trying to instantiate a Parser # object directly. if magic != "xyzzy": raise YaccError, "Can't instantiate Parser. Use yacc() instead." 
# Reset internal state self.productions = None # List of productions self.errorfunc = None # Error handling function self.action = { } # LR Action table self.goto = { } # LR goto table self.require = { } # Attribute require table self.method = "Unknown LR" # Table construction method used def errok(self): self.errorcount = 0 def restart(self): del self.statestack[:] del self.symstack[:] sym = YaccSymbol() sym.type = '$' self.symstack.append(sym) self.statestack.append(0) def parse(self,input=None,lexer=None,debug=0): lookahead = None # Current lookahead symbol lookaheadstack = [ ] # Stack of lookahead symbols actions = self.action # Local reference to action table goto = self.goto # Local reference to goto table prod = self.productions # Local reference to production list pslice = YaccProduction(None) # Production object passed to grammar rules pslice.parser = self # Parser object self.errorcount = 0 # Used during error recovery # If no lexer was given, we will try to use the lex module if not lexer: import lex as lexer pslice.lexer = lexer # If input was supplied, pass to lexer if input: lexer.input(input) # Tokenize function get_token = lexer.token statestack = [ ] # Stack of parsing states self.statestack = statestack symstack = [ ] # Stack of grammar symbols self.symstack = symstack errtoken = None # Err token # The start state is assumed to be (0,$) statestack.append(0) sym = YaccSymbol() sym.type = '$' symstack.append(sym) while 1: # Get the next symbol on the input. If a lookahead symbol # is already set, we just use that. Otherwise, we'll pull # the next token off of the lookaheadstack or from the lexer if not lookahead: if not lookaheadstack: lookahead = get_token() # Get the next token else: lookahead = lookaheadstack.pop() if not lookahead: lookahead = YaccSymbol() lookahead.type = '$' if debug: errorlead = ("%s . %s" % (" ".join([xx.type for xx in symstack][1:]), str(lookahead))).lstrip() # Check the action table s = statestack[-1] ltype = lookahead.type t = actions.get((s,ltype),None) if t is not None: if t > 0: # shift a symbol on the stack if ltype == '$': # Error, end of input sys.stderr.write("yacc: Parse error. EOF\n") return statestack.append(t) if debug > 1: sys.stderr.write("%-60s shift state %s\n" % (errorlead, t)) symstack.append(lookahead) lookahead = None # Decrease error count on successful shift if self.errorcount > 0: self.errorcount -= 1 continue if t < 0: # reduce a symbol on the stack, emit a production p = prod[-t] pname = p.name plen = p.len # Get production function sym = YaccSymbol() sym.type = pname # Production name sym.value = None if debug > 1: sys.stderr.write("%-60s reduce %d\n" % (errorlead, -t)) if plen: targ = symstack[-plen-1:] targ[0] = sym try: sym.lineno = targ[1].lineno sym.endlineno = getattr(targ[-1],"endlineno",targ[-1].lineno) except AttributeError: sym.lineno = 0 del symstack[-plen:] del statestack[-plen:] else: sym.lineno = 0 targ = [ sym ] pslice.slice = targ pslice.pbstack = [] # Call the grammar rule with our special slice object p.func(pslice) # If there was a pushback, put that on the stack if pslice.pbstack: lookaheadstack.append(lookahead) for _t in pslice.pbstack: lookaheadstack.append(_t) lookahead = None symstack.append(sym) statestack.append(goto[statestack[-1],pname]) continue if t == 0: n = symstack[-1] return getattr(n,"value",None) sys.stderr.write(errorlead, "\n") if t == None: if debug: sys.stderr.write(errorlead + "\n") # We have some kind of parsing error here. 
To handle # this, we are going to push the current token onto # the tokenstack and replace it with an 'error' token. # If there are any synchronization rules, they may # catch it. # # In addition to pushing the error token, we call call # the user defined p_error() function if this is the # first syntax error. This function is only called if # errorcount == 0. if not self.errorcount: self.errorcount = error_count errtoken = lookahead if errtoken.type == '$': errtoken = None # End of file! if self.errorfunc: global errok,token,restart errok = self.errok # Set some special functions available in error recovery token = get_token restart = self.restart tok = self.errorfunc(errtoken) del errok, token, restart # Delete special functions if not self.errorcount: # User must have done some kind of panic # mode recovery on their own. The # returned token is the next lookahead lookahead = tok errtoken = None continue else: if errtoken: if hasattr(errtoken,"lineno"): lineno = lookahead.lineno else: lineno = 0 if lineno: sys.stderr.write("yacc: Syntax error at line %d, token=%s\n" % (lineno, errtoken.type)) else: sys.stderr.write("yacc: Syntax error, token=%s" % errtoken.type) else: sys.stderr.write("yacc: Parse error in input. EOF\n") return else: self.errorcount = error_count # case 1: the statestack only has 1 entry on it. If we're in this state, the # entire parse has been rolled back and we're completely hosed. The token is # discarded and we just keep going. if len(statestack) <= 1 and lookahead.type != '$': lookahead = None errtoken = None # Nuke the pushback stack del lookaheadstack[:] continue # case 2: the statestack has a couple of entries on it, but we're # at the end of the file. nuke the top entry and generate an error token # Start nuking entries on the stack if lookahead.type == '$': # Whoa. We're really hosed here. Bail out return if lookahead.type != 'error': sym = symstack[-1] if sym.type == 'error': # Hmmm. Error is on top of stack, we'll just nuke input # symbol and continue lookahead = None continue t = YaccSymbol() t.type = 'error' if hasattr(lookahead,"lineno"): t.lineno = lookahead.lineno t.value = lookahead lookaheadstack.append(lookahead) lookahead = t else: symstack.pop() statestack.pop() continue # Call an error function here raise RuntimeError, "yacc: internal parser error!!!\n" # ----------------------------------------------------------------------------- # === Parser Construction === # # The following functions and variables are used to implement the yacc() function # itself. This is pretty hairy stuff involving lots of error checking, # construction of LR items, kernels, and so forth. Although a lot of # this work is done using global variables, the resulting Parser object # is completely self contained--meaning that it is safe to repeatedly # call yacc() with different grammars in the same application. # ----------------------------------------------------------------------------- # ----------------------------------------------------------------------------- # validate_file() # # This function checks to see if there are duplicated p_rulename() functions # in the parser module file. Without this function, it is really easy for # users to make mistakes by cutting and pasting code fragments (and it's a real # bugger to try and figure out why the resulting parser doesn't work). Therefore, # we just do a little regular expression pattern matching of def statements # to try and detect duplicates. 
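#
# For instance (an illustrative sketch, not taken from this file), a grammar rule is
# normally supplied as a p_ function whose docstring carries the BNF and whose body
# assigns the result through the production slice:
#
#     def p_expression_plus(p):
#         'expression : expression PLUS term'
#         p[0] = p[1] + p[3]
#
# Pasting a second def p_expression_plus() into the same module silently rebinds the
# name, so only the last copy is seen; that is exactly the mistake checked for below.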
# ----------------------------------------------------------------------------- def validate_file(filename): base,ext = os.path.splitext(filename) if ext != '.py': return 1 # No idea. Assume it's okay. try: f = open(filename) lines = f.readlines() f.close() except IOError: return 1 # Oh well # Match def p_funcname( fre = re.compile(r'\s*def\s+(p_[a-zA-Z_0-9]*)\(') counthash = { } linen = 1 noerror = 1 for l in lines: m = fre.match(l) if m: name = m.group(1) prev = counthash.get(name) if not prev: counthash[name] = linen else: sys.stderr.write("%s:%d: Function %s redefined. Previously defined on line %d\n" % (filename,linen,name,prev)) noerror = 0 linen += 1 return noerror # This function looks for functions that might be grammar rules, but which don't have the proper p_suffix. def validate_dict(d): for n,v in d.items(): if n[0:2] == 'p_' and type(v) in (types.FunctionType, types.MethodType): continue if n[0:2] == 't_': continue if n[0:2] == 'p_': sys.stderr.write("yacc: Warning. '%s' not defined as a function\n" % n) if 1 and isinstance(v,types.FunctionType) and v.func_code.co_argcount == 1: try: doc = v.__doc__.split(" ") if doc[1] == ':': sys.stderr.write("%s:%d: Warning. Possible grammar rule '%s' defined without p_ prefix.\n" % (v.func_code.co_filename, v.func_code.co_firstlineno,n)) except StandardError: pass # ----------------------------------------------------------------------------- # === GRAMMAR FUNCTIONS === # # The following global variables and functions are used to store, manipulate, # and verify the grammar rules specified by the user. # ----------------------------------------------------------------------------- # Initialize all of the global variables used during grammar construction def initialize_vars(): global Productions, Prodnames, Prodmap, Terminals global Nonterminals, First, Follow, Precedence, LRitems global Errorfunc, Signature, Requires # LALR(1) globals global Prodempty, TReductions, NTReductions, GotoSetNum, Canonical Productions = [None] # A list of all of the productions. The first # entry is always reserved for the purpose of # building an augmented grammar Prodnames = { } # A dictionary mapping the names of nonterminals to a list of all # productions of that nonterminal. Prodmap = { } # A dictionary that is only used to detect duplicate # productions. Terminals = { } # A dictionary mapping the names of terminal symbols to a # list of the rules where they are used. Nonterminals = { } # A dictionary mapping names of nonterminals to a list # of rule numbers where they are used. First = { } # A dictionary of precomputed FIRST(x) symbols Follow = { } # A dictionary of precomputed FOLLOW(x) symbols Precedence = { } # Precedence rules for each terminal. Contains tuples of the # form ('right',level) or ('nonassoc', level) or ('left',level) LRitems = [ ] # A list of all LR items for the grammar. These are the # productions with the "dot" like E -> E . PLUS E Errorfunc = None # User defined error handler Signature = md5.new() # Digital signature of the grammar rules, precedence # and other information. Used to determined when a # parsing table needs to be regenerated. 
Requires = { } # Requires list # LALR(1) Initialization Prodempty = { } # A dictionary of all productions that have an empty rule # of the form P : TReductions = { } # A dictionary of precomputer reductions from # nonterminals to terminals NTReductions = { } # A dictionary of precomputed reductions from # nonterminals to nonterminals GotoSetNum = { } # A dictionary that remembers goto sets based on # the state number and symbol Canonical = { } # A list of LR item sets. A LR item set is a list of LR # items that represent the state of the parser # File objects used when creating the parser.out debugging file global _vf, _vfc _vf = cStringIO.StringIO() _vfc = cStringIO.StringIO() # ----------------------------------------------------------------------------- # class Production: # # This class stores the raw information about a single production or grammar rule. # It has a few required attributes: # # name - Name of the production (nonterminal) # prod - A list of symbols making up its production # number - Production number. # # In addition, a few additional attributes are used to help with debugging or # optimization of table generation. # # file - File where production action is defined. # lineno - Line number where action is defined # func - Action function # prec - Precedence level # lr_next - Next LR item. Example, if we are ' E -> E . PLUS E' # then lr_next refers to 'E -> E PLUS . E' # lr_index - LR item index (location of the ".") in the prod list. # lookaheads - LALR lookahead symbols for this item # len - Length of the production (number of symbols on right hand side) # ----------------------------------------------------------------------------- class Production: def __init__(self,**kw): for k,v in kw.items(): setattr(self,k,v) self.lr_index = -1 self.lr0_added = 0 # Flag indicating whether or not added to LR0 closure self.lr1_added = 0 # Flag indicating whether or not added to LR1 self.usyms = [ ] self.lookaheads = { } self.lk_added = { } self.setnumbers = [ ] def __str__(self): if self.prod: s = "%s -> %s" % (self.name," ".join(self.prod)) else: s = "%s -> " % self.name return s def __repr__(self): return str(self) # Compute lr_items from the production def lr_item(self,n): if n > len(self.prod): return None p = Production() p.name = self.name p.prod = list(self.prod) p.number = self.number p.lr_index = n p.lookaheads = { } p.setnumbers = self.setnumbers p.prod.insert(n,".") p.prod = tuple(p.prod) p.len = len(p.prod) p.usyms = self.usyms # Precompute list of productions immediately following try: p.lrafter = Prodnames[p.prod[n+1]] except (IndexError,KeyError),e: p.lrafter = [] try: p.lrbefore = p.prod[n-1] except IndexError: p.lrbefore = None return p class MiniProduction: pass # Utility function def is_identifier(s): for c in s: if not (c.isalnum() or c == '_'): return 0 return 1 # ----------------------------------------------------------------------------- # add_production() # # Given an action function, this function assembles a production rule. # The production rule is assumed to be found in the function's docstring. # This rule has the general syntax: # # name1 ::= production1 # | production2 # | production3 # ... # | productionn # name2 ::= production1 # | production2 # ... # ----------------------------------------------------------------------------- def add_production(f,file,line,prodname,syms): if Terminals.has_key(prodname): sys.stderr.write("%s:%d: Illegal rule name '%s'. 
Already defined as a token.\n" % (file,line,prodname)) return -1 if prodname == 'error': sys.stderr.write("%s:%d: Illegal rule name '%s'. error is a reserved word.\n" % (file,line,prodname)) return -1 if not is_identifier(prodname): sys.stderr.write("%s:%d: Illegal rule name '%s'\n" % (file,line,prodname)) return -1 for s in syms: if not is_identifier(s) and s != '%prec': sys.stderr.write("%s:%d: Illegal name '%s' in rule '%s'\n" % (file,line,s, prodname)) return -1 # See if the rule is already in the rulemap map = "%s -> %s" % (prodname,syms) if Prodmap.has_key(map): m = Prodmap[map] sys.stderr.write("%s:%d: Duplicate rule %s.\n" % (file,line, m)) sys.stderr.write("%s:%d: Previous definition at %s:%d\n" % (file,line, m.file, m.line)) return -1 p = Production() p.name = prodname p.prod = syms p.file = file p.line = line p.func = f p.number = len(Productions) Productions.append(p) Prodmap[map] = p if not Nonterminals.has_key(prodname): Nonterminals[prodname] = [ ] # Add all terminals to Terminals i = 0 while i < len(p.prod): t = p.prod[i] if t == '%prec': try: precname = p.prod[i+1] except IndexError: sys.stderr.write("%s:%d: Syntax error. Nothing follows %%prec.\n" % (p.file,p.line)) return -1 prec = Precedence.get(precname,None) if not prec: sys.stderr.write("%s:%d: Nothing known about the precedence of '%s'\n" % (p.file,p.line,precname)) return -1 else: p.prec = prec del p.prod[i] del p.prod[i] continue if Terminals.has_key(t): Terminals[t].append(p.number) # Is a terminal. We'll assign a precedence to p based on this if not hasattr(p,"prec"): p.prec = Precedence.get(t,('right',0)) else: if not Nonterminals.has_key(t): Nonterminals[t] = [ ] Nonterminals[t].append(p.number) i += 1 if not hasattr(p,"prec"): p.prec = ('right',0) # Set final length of productions p.len = len(p.prod) p.prod = tuple(p.prod) # Calculate unique syms in the production p.usyms = [ ] for s in p.prod: if s not in p.usyms: p.usyms.append(s) # Add to the global productions list try: Prodnames[p.name].append(p) except KeyError: Prodnames[p.name] = [ p ] return 0 # Given a raw rule function, this function rips out its doc string # and adds rules to the grammar def add_function(f): line = f.func_code.co_firstlineno file = f.func_code.co_filename error = 0 if isinstance(f,types.MethodType): reqdargs = 2 else: reqdargs = 1 if f.func_code.co_argcount > reqdargs: sys.stderr.write("%s:%d: Rule '%s' has too many arguments.\n" % (file,line,f.__name__)) return -1 if f.func_code.co_argcount < reqdargs: sys.stderr.write("%s:%d: Rule '%s' requires an argument.\n" % (file,line,f.__name__)) return -1 if f.__doc__: # Split the doc string into lines pstrings = f.__doc__.splitlines() lastp = None dline = line for ps in pstrings: dline += 1 p = ps.split() if not p: continue try: if p[0] == '|': # This is a continuation of a previous rule if not lastp: sys.stderr.write("%s:%d: Misplaced '|'.\n" % (file,dline)) return -1 prodname = lastp if len(p) > 1: syms = p[1:] else: syms = [ ] else: prodname = p[0] lastp = prodname assign = p[1] if len(p) > 2: syms = p[2:] else: syms = [ ] if assign != ':' and assign != '::=': sys.stderr.write("%s:%d: Syntax error. 
Expected ':'\n" % (file,dline)) return -1 e = add_production(f,file,dline,prodname,syms) error += e except StandardError: sys.stderr.write("%s:%d: Syntax error in rule '%s'\n" % (file,dline,ps)) error -= 1 else: sys.stderr.write("%s:%d: No documentation string specified in function '%s'\n" % (file,line,f.__name__)) return error # Cycle checking code (Michael Dyck) def compute_reachable(): ''' Find each symbol that can be reached from the start symbol. Print a warning for any nonterminals that can't be reached. (Unused terminals have already had their warning.) ''' Reachable = { } for s in Terminals.keys() + Nonterminals.keys(): Reachable[s] = 0 mark_reachable_from( Productions[0].prod[0], Reachable ) for s in Nonterminals.keys(): if not Reachable[s]: sys.stderr.write("yacc: Symbol '%s' is unreachable.\n" % s) def mark_reachable_from(s, Reachable): ''' Mark all symbols that are reachable from symbol s. ''' if Reachable[s]: # We've already reached symbol s. return Reachable[s] = 1 for p in Prodnames.get(s,[]): for r in p.prod: mark_reachable_from(r, Reachable) # ----------------------------------------------------------------------------- # compute_terminates() # # This function looks at the various parsing rules and tries to detect # infinite recursion cycles (grammar rules where there is no possible way # to derive a string of only terminals). # ----------------------------------------------------------------------------- def compute_terminates(): ''' Raise an error for any symbols that don't terminate. ''' Terminates = {} # Terminals: for t in Terminals.keys(): Terminates[t] = 1 Terminates['$'] = 1 # Nonterminals: # Initialize to false: for n in Nonterminals.keys(): Terminates[n] = 0 # Then propagate termination until no change: while 1: some_change = 0 for (n,pl) in Prodnames.items(): # Nonterminal n terminates iff any of its productions terminates. for p in pl: # Production p terminates iff all of its rhs symbols terminate. for s in p.prod: if not Terminates[s]: # The symbol s does not terminate, # so production p does not terminate. p_terminates = 0 break else: # didn't break from the loop, # so every symbol s terminates # so production p terminates. p_terminates = 1 if p_terminates: # symbol n terminates! if not Terminates[n]: Terminates[n] = 1 some_change = 1 # Don't need to consider any more productions for this n. break if not some_change: break some_error = 0 for (s,terminates) in Terminates.items(): if not terminates: if not Prodnames.has_key(s) and not Terminals.has_key(s) and s != 'error': # s is used-but-not-defined, and we've already warned of that, # so it would be overkill to say that it's also non-terminating. pass else: sys.stderr.write("yacc: Infinite recursion detected for symbol '%s'.\n" % s) some_error = 1 return some_error # ----------------------------------------------------------------------------- # verify_productions() # # This function examines all of the supplied rules to see if they seem valid. # ----------------------------------------------------------------------------- def verify_productions(cycle_check=1): error = 0 for p in Productions: if not p: continue for s in p.prod: if not Prodnames.has_key(s) and not Terminals.has_key(s) and s != 'error': sys.stderr.write("%s:%d: Symbol '%s' used, but not defined as a token or a rule.\n" % (p.file,p.line,s)) error = 1 continue unused_tok = 0 # Now verify all of the tokens if yaccdebug: _vf.write("Unused terminals:\n\n") for s,v in Terminals.items(): if s != 'error' and not v: sys.stderr.write("yacc: Warning. 
Token '%s' defined, but not used.\n" % s) if yaccdebug: _vf.write(" %s\n"% s) unused_tok += 1 # Print out all of the productions if yaccdebug: _vf.write("\nGrammar\n\n") for i in range(1,len(Productions)): _vf.write("Rule %-5d %s\n" % (i, Productions[i])) unused_prod = 0 # Verify the use of all productions for s,v in Nonterminals.items(): if not v: p = Prodnames[s][0] sys.stderr.write("%s:%d: Warning. Rule '%s' defined, but not used.\n" % (p.file,p.line, s)) unused_prod += 1 if unused_tok == 1: sys.stderr.write("yacc: Warning. There is 1 unused token.\n") if unused_tok > 1: sys.stderr.write("yacc: Warning. There are %d unused tokens.\n" % unused_tok) if unused_prod == 1: sys.stderr.write("yacc: Warning. There is 1 unused rule.\n") if unused_prod > 1: sys.stderr.write("yacc: Warning. There are %d unused rules.\n" % unused_prod) if yaccdebug: _vf.write("\nTerminals, with rules where they appear\n\n") ks = Terminals.keys() ks.sort() for k in ks: _vf.write("%-20s : %s\n" % (k, " ".join([str(s) for s in Terminals[k]]))) _vf.write("\nNonterminals, with rules where they appear\n\n") ks = Nonterminals.keys() ks.sort() for k in ks: _vf.write("%-20s : %s\n" % (k, " ".join([str(s) for s in Nonterminals[k]]))) if (cycle_check): compute_reachable() error += compute_terminates() # error += check_cycles() return error # ----------------------------------------------------------------------------- # build_lritems() # # This function walks the list of productions and builds a complete set of the # LR items. The LR items are stored in two ways: First, they are uniquely # numbered and placed in the list _lritems. Second, a linked list of LR items # is built for each production. For example: # # E -> E PLUS E # # Creates the list # # [E -> . E PLUS E, E -> E . PLUS E, E -> E PLUS . E, E -> E PLUS E . ] # ----------------------------------------------------------------------------- def build_lritems(): for p in Productions: lastlri = p lri = p.lr_item(0) i = 0 while 1: lri = p.lr_item(i) lastlri.lr_next = lri if not lri: break lri.lr_num = len(LRitems) LRitems.append(lri) lastlri = lri i += 1 # In order for the rest of the parser generator to work, we need to # guarantee that no more lritems are generated. Therefore, we nuke # the p.lr_item method. (Only used in debugging) # Production.lr_item = None # ----------------------------------------------------------------------------- # add_precedence() # # Given a list of precedence rules, add to the precedence table. # ----------------------------------------------------------------------------- def add_precedence(plist): plevel = 0 error = 0 for p in plist: plevel += 1 try: prec = p[0] terms = p[1:] if prec != 'left' and prec != 'right' and prec != 'nonassoc': sys.stderr.write("yacc: Invalid precedence '%s'\n" % prec) return -1 for t in terms: if Precedence.has_key(t): sys.stderr.write("yacc: Precedence already specified for terminal '%s'\n" % t) error += 1 continue Precedence[t] = (prec,plevel) except: sys.stderr.write("yacc: Invalid precedence table.\n") error += 1 return error # ----------------------------------------------------------------------------- # augment_grammar() # # Compute the augmented grammar. This is just a rule S' -> start where start # is the starting symbol. 
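#
# For example, if the user grammar's start symbol is 'expression', augmentation simply
# prepends rule 0, S' -> expression, so the table constructors below can detect
# acceptance when the parser reduces by this distinguished rule.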
# ----------------------------------------------------------------------------- def augment_grammar(start=None): if not start: start = Productions[1].name Productions[0] = Production(name="S'",prod=[start],number=0,len=1,prec=('right',0),func=None) Productions[0].usyms = [ start ] Nonterminals[start].append(0) # ------------------------------------------------------------------------- # first() # # Compute the value of FIRST1(beta) where beta is a tuple of symbols. # # During execution of compute_first1, the result may be incomplete. # Afterward (e.g., when called from compute_follow()), it will be complete. # ------------------------------------------------------------------------- def first(beta): # We are computing First(x1,x2,x3,...,xn) result = [ ] for x in beta: x_produces_empty = 0 # Add all the non- symbols of First[x] to the result. for f in First[x]: if f == '': x_produces_empty = 1 else: if f not in result: result.append(f) if x_produces_empty: # We have to consider the next x in beta, # i.e. stay in the loop. pass else: # We don't have to consider any further symbols in beta. break else: # There was no 'break' from the loop, # so x_produces_empty was true for all x in beta, # so beta produces empty as well. result.append('') return result # FOLLOW(x) # Given a non-terminal. This function computes the set of all symbols # that might follow it. Dragon book, p. 189. def compute_follow(start=None): # Add '$' to the follow list of the start symbol for k in Nonterminals.keys(): Follow[k] = [ ] if not start: start = Productions[1].name Follow[start] = [ '$' ] while 1: didadd = 0 for p in Productions[1:]: # Here is the production set for i in range(len(p.prod)): B = p.prod[i] if Nonterminals.has_key(B): # Okay. We got a non-terminal in a production fst = first(p.prod[i+1:]) hasempty = 0 for f in fst: if f != '' and f not in Follow[B]: Follow[B].append(f) didadd = 1 if f == '': hasempty = 1 if hasempty or i == (len(p.prod)-1): # Add elements of follow(a) to follow(b) for f in Follow[p.name]: if f not in Follow[B]: Follow[B].append(f) didadd = 1 if not didadd: break if 0 and yaccdebug: _vf.write('\nFollow:\n') for k in Nonterminals.keys(): _vf.write("%-20s : %s\n" % (k, " ".join([str(s) for s in Follow[k]]))) # ------------------------------------------------------------------------- # compute_first1() # # Compute the value of FIRST1(X) for all symbols # ------------------------------------------------------------------------- def compute_first1(): # Terminals: for t in Terminals.keys(): First[t] = [t] First['$'] = ['$'] First['#'] = ['#'] # what's this for? # Nonterminals: # Initialize to the empty set: for n in Nonterminals.keys(): First[n] = [] # Then propagate symbols until no change: while 1: some_change = 0 for n in Nonterminals.keys(): for p in Prodnames[n]: for f in first(p.prod): if f not in First[n]: First[n].append( f ) some_change = 1 if not some_change: break if 0 and yaccdebug: _vf.write('\nFirst:\n') for k in Nonterminals.keys(): _vf.write("%-20s : %s\n" % (k, " ".join([str(s) for s in First[k]]))) # ----------------------------------------------------------------------------- # === SLR Generation === # # The following functions are used to construct SLR (Simple LR) parsing tables # as described on p.221-229 of the dragon book. 
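#
# A small worked illustration (not from the original comments) of the FIRST/FOLLOW
# machinery defined above, as it feeds into the SLR construction: for the toy grammar
#
#     E : E PLUS T
#       | T
#     T : NUMBER
#
# compute_first1() gives FIRST(E) = FIRST(T) = {NUMBER}, and compute_follow() gives
# FOLLOW(E) = FOLLOW(T) = {PLUS, '$'}. slr_parse_table() below places a reduce action
# for a completed item only on the terminals in FOLLOW of its left-hand side.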
# ----------------------------------------------------------------------------- # Global variables for the LR parsing engine def lr_init_vars(): global _lr_action, _lr_goto, _lr_method global _lr_goto_cache _lr_action = { } # Action table _lr_goto = { } # Goto table _lr_method = "Unknown" # LR method used _lr_goto_cache = { } # Compute the LR(0) closure operation on I, where I is a set of LR(0) items. # prodlist is a list of productions. _add_count = 0 # Counter used to detect cycles def lr0_closure(I): global _add_count _add_count += 1 prodlist = Productions # Add everything in I to J J = I[:] didadd = 1 while didadd: didadd = 0 for j in J: for x in j.lrafter: if x.lr0_added == _add_count: continue # Add B --> .G to J J.append(x.lr_next) x.lr0_added = _add_count didadd = 1 return J # Compute the LR(0) goto function goto(I,X) where I is a set # of LR(0) items and X is a grammar symbol. This function is written # in a way that guarantees uniqueness of the generated goto sets # (i.e. the same goto set will never be returned as two different Python # objects). With uniqueness, we can later do fast set comparisons using # id(obj) instead of element-wise comparison. def lr0_goto(I,x): # First we look for a previously cached entry g = _lr_goto_cache.get((id(I),x),None) if g: return g # Now we generate the goto set in a way that guarantees uniqueness # of the result s = _lr_goto_cache.get(x,None) if not s: s = { } _lr_goto_cache[x] = s gs = [ ] for p in I: n = p.lr_next if n and n.lrbefore == x: s1 = s.get(id(n),None) if not s1: s1 = { } s[id(n)] = s1 gs.append(n) s = s1 g = s.get('$',None) if not g: if gs: g = lr0_closure(gs) s['$'] = g else: s['$'] = gs _lr_goto_cache[(id(I),x)] = g return g # Added for LALR(1) # Given a setnumber of an lr0 state and a symbol return the setnumber of the goto state def lr0_goto_setnumber(I_setnumber, x): global Canonical global GotoSetNum if GotoSetNum.has_key((I_setnumber, x)): setnumber = GotoSetNum[(I_setnumber, x)] else: gset = lr0_goto(Canonical[I_setnumber], x) if not gset: return -1 else: gsetlen = len(gset) for i in xrange(len(gset[0].setnumbers)): inall = 1 for item in gset: if not item.setnumbers[i]: inall = 0 break if inall and len(Canonical[i]) == gsetlen: setnumber = i break # Note: DB. I added this to improve performance. # Not sure if this breaks the algorithm (it doesn't appear to). GotoSetNum[(I_setnumber, x)] = setnumber return setnumber # Compute the kernel of a set of LR(0) items def lr0_kernel(I): KI = [ ] for p in I: if p.name == "S'" or p.lr_index > 0 or p.len == 0: KI.append(p) return KI _lr0_cidhash = { } # Compute the LR(0) sets of item function def lr0_items(): C = [ lr0_closure([Productions[0].lr_next]) ] i = 0 for I in C: _lr0_cidhash[id(I)] = i i += 1 # Loop over the items in C and each grammar symbols i = 0 while i < len(C): I = C[i] i += 1 # Collect all of the symbols that could possibly be in the goto(I,X) sets asyms = { } for ii in I: for s in ii.usyms: asyms[s] = None for x in asyms.keys(): g = lr0_goto(I,x) if not g: continue if _lr0_cidhash.has_key(id(g)): continue _lr0_cidhash[id(g)] = len(C) C.append(g) return C # ----------------------------------------------------------------------------- # slr_parse_table() # # This function constructs an SLR table. 
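#
# The table encoding matches what Parser.parse() expects: action[state, terminal] > 0
# means shift and go to that state, < 0 means reduce by production number -value,
# 0 means accept, and a missing entry is a syntax error; goto[state, nonterminal]
# names the state to enter after such a reduction.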
# ----------------------------------------------------------------------------- def slr_parse_table(): global _lr_method goto = _lr_goto # Goto array action = _lr_action # Action array actionp = { } # Action production array (temporary) _lr_method = "SLR" n_srconflict = 0 n_rrconflict = 0 if yaccdebug: sys.stderr.write("yacc: Generating SLR parsing table...\n") _vf.write("\n\nParsing method: SLR\n\n") # Step 1: Construct C = { I0, I1, ... IN}, collection of LR(0) items # This determines the number of states C = lr0_items() # Build the parser table, state by state st = 0 for I in C: # Loop over each production in I actlist = [ ] # List of actions if yaccdebug: _vf.write("\nstate %d\n\n" % st) for p in I: _vf.write(" (%d) %s\n" % (p.number, str(p))) _vf.write("\n") for p in I: try: if p.prod[-1] == ".": if p.name == "S'": # Start symbol. Accept! action[st,"$"] = 0 actionp[st,"$"] = p else: # We are at the end of a production. Reduce! for a in Follow[p.name]: actlist.append((a,p,"reduce using rule %d (%s)" % (p.number,p))) r = action.get((st,a),None) if r is not None: # Whoa. Have a shift/reduce or reduce/reduce conflict if r > 0: # Need to decide on shift or reduce here # By default we favor shifting. Need to add # some precedence rules here. sprec,slevel = Productions[actionp[st,a].number].prec rprec,rlevel = Precedence.get(a,('right',0)) if (slevel < rlevel) or ((slevel == rlevel) and (rprec == 'left')): # We really need to reduce here. action[st,a] = -p.number actionp[st,a] = p if not slevel and not rlevel: _vfc.write("shift/reduce conflict in state %d resolved as reduce.\n" % st) _vf.write(" ! shift/reduce conflict for %s resolved as reduce.\n" % a) n_srconflict += 1 elif (slevel == rlevel) and (rprec == 'nonassoc'): action[st,a] = None else: # Hmmm. Guess we'll keep the shift if not slevel and not rlevel: _vfc.write("shift/reduce conflict in state %d resolved as shift.\n" % st) _vf.write(" ! shift/reduce conflict for %s resolved as shift.\n" % a) n_srconflict +=1 elif r < 0: # Reduce/reduce conflict. In this case, we favor the rule # that was defined first in the grammar file oldp = Productions[-r] pp = Productions[p.number] if oldp.line > pp.line: action[st,a] = -p.number actionp[st,a] = p # sys.stderr.write("Reduce/reduce conflict in state %d\n" % st) n_rrconflict += 1 _vfc.write("reduce/reduce conflict in state %d resolved using rule %d (%s).\n" % (st, actionp[st,a].number, actionp[st,a])) _vf.write(" ! reduce/reduce conflict for %s resolved using rule %d (%s).\n" % (a,actionp[st,a].number, actionp[st,a])) else: sys.stderr.write("Unknown conflict in state %d\n" % st) else: action[st,a] = -p.number actionp[st,a] = p else: i = p.lr_index a = p.prod[i+1] # Get symbol right after the "." if Terminals.has_key(a): g = lr0_goto(I,a) j = _lr0_cidhash.get(id(g),-1) if j >= 0: # We are in a shift state actlist.append((a,p,"shift and go to state %d" % j)) r = action.get((st,a),None) if r is not None: # Whoa have a shift/reduce or shift/shift conflict if r > 0: if r != j: sys.stderr.write("Shift/shift conflict in state %d\n" % st) elif r < 0: # Do a precedence check. # - if precedence of reduce rule is higher, we reduce. # - if precedence of reduce is same and left assoc, we reduce. # - otherwise we shift rprec,rlevel = Productions[actionp[st,a].number].prec sprec,slevel = Precedence.get(a,('right',0)) if (slevel > rlevel) or ((slevel == rlevel) and (rprec != 'left')): # We decide to shift here... 
highest precedence to shift action[st,a] = j actionp[st,a] = p if not slevel and not rlevel: n_srconflict += 1 _vfc.write("shift/reduce conflict in state %d resolved as shift.\n" % st) _vf.write(" ! shift/reduce conflict for %s resolved as shift.\n" % a) elif (slevel == rlevel) and (rprec == 'nonassoc'): action[st,a] = None else: # Hmmm. Guess we'll keep the reduce if not slevel and not rlevel: n_srconflict +=1 _vfc.write("shift/reduce conflict in state %d resolved as reduce.\n" % st) _vf.write(" ! shift/reduce conflict for %s resolved as reduce.\n" % a) else: sys.stderr.write("Unknown conflict in state %d\n" % st) else: action[st,a] = j actionp[st,a] = p except StandardError,e: raise YaccError, "Hosed in slr_parse_table", e # Print the actions associated with each terminal if yaccdebug: _actprint = { } for a,p,m in actlist: if action.has_key((st,a)): if p is actionp[st,a]: _vf.write(" %-15s %s\n" % (a,m)) _actprint[(a,m)] = 1 _vf.write("\n") for a,p,m in actlist: if action.has_key((st,a)): if p is not actionp[st,a]: if not _actprint.has_key((a,m)): _vf.write(" ! %-15s [ %s ]\n" % (a,m)) _actprint[(a,m)] = 1 # Construct the goto table for this state if yaccdebug: _vf.write("\n") nkeys = { } for ii in I: for s in ii.usyms: if Nonterminals.has_key(s): nkeys[s] = None for n in nkeys.keys(): g = lr0_goto(I,n) j = _lr0_cidhash.get(id(g),-1) if j >= 0: goto[st,n] = j if yaccdebug: _vf.write(" %-30s shift and go to state %d\n" % (n,j)) st += 1 if yaccdebug: if n_srconflict == 1: sys.stderr.write("yacc: %d shift/reduce conflict\n" % n_srconflict) if n_srconflict > 1: sys.stderr.write("yacc: %d shift/reduce conflicts\n" % n_srconflict) if n_rrconflict == 1: sys.stderr.write("yacc: %d reduce/reduce conflict\n" % n_rrconflict) if n_rrconflict > 1: sys.stderr.write("yacc: %d reduce/reduce conflicts\n" % n_rrconflict) # ----------------------------------------------------------------------------- # ==== LALR(1) Parsing ==== # FINISHED! 5/20/2003 by Elias Ioup # ----------------------------------------------------------------------------- # Compute the lr1_closure of a set I. I is a list of productions and setnumber # is the state that you want the lr items that are made from the to come from. 
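# (In other words: lr1_closure(I, setnumber) returns the closure of the item set I,
# recording in each item's lookaheads[setnumber] list the lookahead terminals obtained
# via first() relative to LR(0) state number setnumber; add_lookaheads() further below
# propagates these lookaheads between kernel items.)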
_lr1_add_count = 0 def lr1_closure(I, setnumber = 0): global _add_count global Nonterminals _add_count += 1 prodlist = Productions # Add everything in I to J J = I[:] Jhash = { } for j in J: Jhash[id(j)] = 1 didadd = 1 while didadd: didadd = 0 for j in J: jprod = j.prod jlr_index = j.lr_index jprodslice = jprod[jlr_index+2:] if jlr_index < len(jprod) - 1 and Nonterminals.has_key(jprod[jlr_index+1]): first_syms = [] if j.lk_added.setdefault(setnumber, 0) < len(j.lookaheads[setnumber]): for a in j.lookaheads[setnumber][j.lk_added[setnumber]:]: # find b in FIRST(Xa) if j = [A->a.BX,a] temp_first_syms = first(jprodslice + (a,)) for x in temp_first_syms: if x not in first_syms: first_syms.append(x) j.lk_added[setnumber] = len(j.lookaheads[setnumber]) for x in j.lrafter: # Add B --> .G to J if x.lr_next.lookaheads.has_key(setnumber): _xlook = x.lr_next.lookaheads[setnumber] for s in first_syms: if s not in _xlook: _xlook.append(s) didadd = 1 else: x.lr_next.lookaheads[setnumber] = first_syms didadd = 1 nid = id(x.lr_next) if not Jhash.has_key(nid): J.append(x.lr_next) Jhash[nid] = 1 return J def add_lookaheads(K): spontaneous = [] propogate = [] for setnumber in range(len(K)): for kitem in K[setnumber]: kitem.lookaheads[setnumber] = ['#'] J = lr1_closure([kitem], setnumber) # find the lookaheads that are spontaneously created from closures # and the propogations of lookaheads between lr items for item in J: if item.lr_index < len(item.prod)-1: for lookahead in item.lookaheads[setnumber]: goto_setnumber = lr0_goto_setnumber(setnumber, item.prod[item.lr_index+1]) next = None if lookahead != '#': if item.lr_next in K[goto_setnumber]: next = item.lr_next if next: spontaneous.append((next, (lookahead, goto_setnumber))) else: if goto_setnumber > -1: if item.lr_next in K[goto_setnumber]: next = item.lr_next if next: propogate.append(((kitem, setnumber), (next, goto_setnumber))) for x in K[setnumber]: x.lookaheads[setnumber] = [] for x in spontaneous: if x[1][0] not in x[0].lookaheads[x[1][1]]: x[0].lookaheads[x[1][1]].append(x[1][0]) K[0][0].lookaheads[0] = ['$'] pitems = {} for x in propogate: if pitems.has_key(x[0]): pitems[x[0]].append(x[1]) else: pitems[x[0]] = [] pitems[x[0]].append(x[1]) # propogate the lookaheads that were spontaneously generated # based on the propogations produced above stop = 0 while not stop: stop = 1 kindex = 0 for set in K: for item in set: pkey = (item, kindex) if pitems.has_key(pkey): for propogation in pitems[pkey]: gitem = propogation[0] gsetnumber = propogation[1] glookaheads = gitem.lookaheads[gsetnumber] for lookahead in item.lookaheads[kindex]: if lookahead not in glookaheads: glookaheads.append(lookahead) stop = 0 kindex += 1 def ReduceNonterminals(): global Nonterminals global TReductions global NTReductions for nt in Nonterminals.keys(): TReductions[nt] = [] NTReductions[nt] = [] for nt in Nonterminals.keys(): terms = ReduceToTerminals(nt) TReductions[nt].extend(terms) if not NTReductions.has_key(nt): ReduceToNonterminals(nt) def ReduceToTerminals(nt): global Prodnames global Terminals reducedterminals = [] for p in Prodnames[nt]: if len(p.prod) > 0: if Terminals.has_key(p.prod[0]): if p.prod[0] not in reducedterminals: reducedterminals.append(p.prod[0]) else: if p.prod[0] != nt: terms = ReduceToTerminals(p.prod[0]) for t in terms: if t not in reducedterminals: reducedterminals.append(t) return reducedterminals def ReduceToNonterminals(nt): global Prodnames global Nonterminals global NTReductions reducednonterminals = [] for p in Prodnames[nt]: if len(p.prod) > 
0: if Nonterminals.has_key(p.prod[0]): if p.prod[0] not in reducednonterminals: reducednonterminals.append(p.prod[0]) if p.prod[0] != nt: if not NTReductions.has_key(p.prod[0]): ReduceToNonterminals(p.prod[0]) nterms = NTReductions[p.prod[0]] for nt in nterms: if nt not in reducednonterminals: reducednonterminals.append(nt) NTReductions[nt] = reducednonterminals # ----------------------------------------------------------------------------- # lalr_parse_table() # # This function constructs an LALR table. # ----------------------------------------------------------------------------- def lalr_parse_table(): global _lr_method goto = _lr_goto # Goto array action = _lr_action # Action array actionp = { } # Action production array (temporary) goto_cache = _lr_goto_cache cid_hash = _lr0_cidhash _lr_method = "LALR" n_srconflict = 0 n_rrconflict = 0 if yaccdebug: sys.stderr.write("yacc: Generating LALR(1) parsing table...\n") _vf.write("\n\nParsing method: LALR(1)\n\n") # Step 1: Construct C = { I0, I1, ... IN}, collection of LR(0) items # This determines the number of states C = lr0_items() global Canonical Canonical = C ### # Create the kernel states. ### K = [] setC = [0]*len(C) for x in C: K.append(lr0_kernel(x)) for y in x: y.setnumbers = setC[:] _cindex = 0 for x in C: for y in x: y.lookaheads[_cindex] = [] y.setnumbers[_cindex] = 1 _cindex = _cindex + 1 ### # Add lookaheads to the lr items ### add_lookaheads(K) ### # Do the reductions for parsing first and keep them in globals ### ReduceNonterminals() global TReductions global NTReductions global Prodempty EmptyAncestors = {} for y in Prodempty.keys(): EmptyAncestors[y] = [] for x in NTReductions.items(): for y in x[1]: if Prodempty.has_key(y): EmptyAncestors[y].append(x[0]) # Build the parser table, state by state st = 0 for I in C: # Loop over each production in I actlist = [ ] # List of actions acthash = { } idI = id(I) if yaccdebug: _vf.write("\nstate %d\n\n" % st) for p in I: _vf.write(" (%d) %s\n" % (p.number, str(p))) _vf.write("\n") global First for p in I: try: if p.prod[-1] == ".": if p.name == "S'": # Start symbol. Accept! action[st,"$"] = 0 actionp[st,"$"] = p elif len(p.prod) == 0: ancestors = EmptyAncestors[p.name] for i in ancestors: for s in K: if i in s: input_list = [] plist = Productions[i.name] for x in plist: if len(x.prod) > 0 and x.prod[0] == p.name: n = p.prod[1:] d = x.prod[lr_index+2:] for l in x.lookaheads.items(): flist = First[tuple(n+d+[l])] for f in flist: if f not in input_list and f in p.lookaheads[st]: input_list.append(f) # We are at the end of a production. Reduce! #print "input_list: %s" % input_list #print "Follow[p.name]: %s" % Follow[p.name] for a in input_list: actlist.append((a,p,"reduce using rule %d (%s) " % (p.number,p))) r = action.get((st,a),None) if r is not None: # Whoa. Have a shift/reduce or reduce/reduce conflict if r > 0: # Need to decide on shift or reduce here # By default we favor shifting. Need to add # some precedence rules here. sprec,slevel = Productions[actionp[st,a].number].prec rprec,rlevel = Precedence.get(a,('right',0)) if (slevel < rlevel) or ((slevel == rlevel) and (rprec == 'left')): # We really need to reduce here. action[st,a] = -p.number actionp[st,a] = p if not slevel and not rlevel: _vfc.write("shift/reduce conflict in state %d resolved as reduce.\n" % st) _vf.write(" ! shift/reduce conflict for %s resolved as reduce.\n" % a) n_srconflict += 1 elif (slevel == rlevel) and (rprec == 'nonassoc'): action[st,a] = None else: # Hmmm. 
Guess we'll keep the shift if not slevel and not rlevel: _vfc.write("shift/reduce conflict in state %d resolved as shift.\n" % st) _vf.write(" ! shift/reduce conflict for %s resolved as shift.\n" % a) n_srconflict +=1 elif r < 0: # Reduce/reduce conflict. In this case, we favor the rule # that was defined first in the grammar file oldp = Productions[-r] pp = Productions[p.number] if oldp.line > pp.line: action[st,a] = -p.number actionp[st,a] = p # print "Reduce/reduce conflict in state %d" % st n_rrconflict += 1 _vfc.write("reduce/reduce conflict in state %d resolved using rule %d.\n" % (st, actionp[st,a].number)) _vf.write(" ! reduce/reduce conflict for %s resolved using rule %d.\n" % (a,actionp[st,a].number)) else: sys.stderr.write("Unknown conflict in state %d\n" % st) else: action[st,a] = -p.number actionp[st,a] = p break # break out of the for s in K loop because we only want to make # sure that a production is in the Kernel else: # We are at the end of a production. Reduce! for a in p.lookaheads[st]: actlist.append((a,p,"reduce using rule %d (%s)" % (p.number,p))) r = action.get((st,a),None) if r is not None: # Whoa. Have a shift/reduce or reduce/reduce conflict if r > 0: # Need to decide on shift or reduce here # By default we favor shifting. Need to add # some precedence rules here. sprec,slevel = Productions[actionp[st,a].number].prec rprec,rlevel = Precedence.get(a,('right',0)) if (slevel < rlevel) or ((slevel == rlevel) and (rprec == 'left')): # We really need to reduce here. action[st,a] = -p.number actionp[st,a] = p if not slevel and not rlevel: _vfc.write("shift/reduce conflict in state %d resolved as reduce.\n" % st) _vf.write(" ! shift/reduce conflict for %s resolved as reduce.\n" % a) n_srconflict += 1 elif (slevel == rlevel) and (rprec == 'nonassoc'): action[st,a] = None else: # Hmmm. Guess we'll keep the shift if not slevel and not rlevel: _vfc.write("shift/reduce conflict in state %d resolved as shift.\n" % st) _vf.write(" ! shift/reduce conflict for %s resolved as shift.\n" % a) n_srconflict +=1 elif r < 0: # Reduce/reduce conflict. In this case, we favor the rule # that was defined first in the grammar file oldp = Productions[-r] pp = Productions[p.number] if oldp.line > pp.line: action[st,a] = -p.number actionp[st,a] = p # print "Reduce/reduce conflict in state %d" % st n_rrconflict += 1 _vfc.write("reduce/reduce conflict in state %d resolved using rule %d.\n" % (st, actionp[st,a].number)) _vf.write(" ! reduce/reduce conflict for %s resolved using rule %d.\n" % (a,actionp[st,a].number)) else: print "Unknown conflict in state %d" % st else: action[st,a] = -p.number actionp[st,a] = p else: i = p.lr_index a = p.prod[i+1] # Get symbol right after the "." if Terminals.has_key(a): g = goto_cache[(idI,a)] j = cid_hash.get(id(g),-1) if j >= 0: # We are in a shift state _k = (a,j) if not acthash.has_key(_k): actlist.append((a,p,"shift and go to state %d" % j)) acthash[_k] = 1 r = action.get((st,a),None) if r is not None: # Whoa have a shift/reduce or shift/shift conflict if r > 0: if r != j: sys.stderr.write("Shift/shift conflict in state %d\n" % st) elif r < 0: # Do a precedence check. # - if precedence of reduce rule is higher, we reduce. # - if precedence of reduce is same and left assoc, we reduce. # - otherwise we shift rprec,rlevel = Productions[actionp[st,a].number].prec sprec,slevel = Precedence.get(a,('right',0)) if (slevel > rlevel) or ((slevel == rlevel) and (rprec != 'left')): # We decide to shift here... 
highest precedence to shift action[st,a] = j actionp[st,a] = p if not slevel and not rlevel: n_srconflict += 1 _vfc.write("shift/reduce conflict in state %d resolved as shift.\n" % st) _vf.write(" ! shift/reduce conflict for %s resolved as shift.\n" % a) elif (slevel == rlevel) and (rprec == 'nonassoc'): action[st,a] = None else: # Hmmm. Guess we'll keep the reduce if not slevel and not rlevel: n_srconflict +=1 _vfc.write("shift/reduce conflict in state %d resolved as reduce.\n" % st) _vf.write(" ! shift/reduce conflict for %s resolved as reduce.\n" % a) else: sys.stderr.write("Unknown conflict in state %d\n" % st) else: action[st,a] = j actionp[st,a] = p else: nonterminal = a term_list = TReductions[nonterminal] # DB: This loop gets executed a lot. Try to optimize for a in term_list: g = goto_cache[(idI,a)] j = cid_hash[id(g)] if j >= 0: # We are in a shift state # Don't put repeated shift actions on action list (performance hack) _k = (a,j) if not acthash.has_key(_k): actlist.append((a,p,"shift and go to state "+str(j))) acthash[_k] = 1 r = action.get((st,a),None) if r is not None: # Whoa have a shift/reduce or shift/shift conflict if r > 0: if r != j: sys.stderr.write("Shift/shift conflict in state %d\n" % st) continue elif r < 0: # Do a precedence check. # - if precedence of reduce rule is higher, we reduce. # - if precedence of reduce is same and left assoc, we reduce. # - otherwise we shift rprec,rlevel = Productions[actionp[st,a].number].prec sprec,slevel = Precedence.get(a,('right',0)) if (slevel > rlevel) or ((slevel == rlevel) and (rprec != 'left')): # We decide to shift here... highest precedence to shift action[st,a] = j actionp[st,a] = p if not slevel and not rlevel: n_srconflict += 1 _vfc.write("shift/reduce conflict in state %d resolved as shift.\n" % st) _vf.write(" ! shift/reduce conflict for %s resolved as shift.\n" % a) elif (slevel == rlevel) and (rprec == 'nonassoc'): action[st,a] = None else: # Hmmm. Guess we'll keep the reduce if not slevel and not rlevel: n_srconflict +=1 _vfc.write("shift/reduce conflict in state %d resolved as reduce.\n" % st) _vf.write(" ! shift/reduce conflict for %s resolved as reduce.\n" % a) else: sys.stderr.write("Unknown conflict in state %d\n" % st) else: action[st,a] = j actionp[st,a] = p except StandardError,e: raise YaccError, "Hosed in lalr_parse_table", e # Print the actions associated with each terminal if yaccdebug: for a,p,m in actlist: if action.has_key((st,a)): if p is actionp[st,a]: _vf.write(" %-15s %s\n" % (a,m)) _vf.write("\n") for a,p,m in actlist: if action.has_key((st,a)): if p is not actionp[st,a]: _vf.write(" ! 
%-15s [ %s ]\n" % (a,m)) # Construct the goto table for this state nkeys = { } for ii in I: for s in ii.usyms: if Nonterminals.has_key(s): nkeys[s] = None # Construct the goto table for this state for n in nkeys.keys(): g = lr0_goto(I,n) j = cid_hash.get(id(g),-1) if j >= 0: goto[st,n] = j if yaccdebug: _vf.write(" %-30s shift and go to state %d\n" % (n,j)) st += 1 if yaccdebug: if n_srconflict == 1: sys.stderr.write("yacc: %d shift/reduce conflict\n" % n_srconflict) if n_srconflict > 1: sys.stderr.write("yacc: %d shift/reduce conflicts\n" % n_srconflict) if n_rrconflict == 1: sys.stderr.write("yacc: %d reduce/reduce conflict\n" % n_rrconflict) if n_rrconflict > 1: sys.stderr.write("yacc: %d reduce/reduce conflicts\n" % n_rrconflict) # ----------------------------------------------------------------------------- # ==== LR Utility functions ==== # ----------------------------------------------------------------------------- # ----------------------------------------------------------------------------- # _lr_write_tables() # # This function writes the LR parsing tables to a file # ----------------------------------------------------------------------------- def lr_write_tables(modulename=tab_module,outputdir=''): filename = os.path.join(outputdir,modulename) + ".py" try: f = open(filename,"w") f.write(""" # %s # This file is automatically generated. Do not edit. _lr_method = %s _lr_signature = %s """ % (filename, repr(_lr_method), repr(Signature.digest()))) # Change smaller to 0 to go back to original tables smaller = 1 # Factor out names to try and make smaller if smaller: items = { } for k,v in _lr_action.items(): i = items.get(k[1]) if not i: i = ([],[]) items[k[1]] = i i[0].append(k[0]) i[1].append(v) f.write("\n_lr_action_items = {") for k,v in items.items(): f.write("%r:([" % k) for i in v[0]: f.write("%r," % i) f.write("],[") for i in v[1]: f.write("%r," % i) f.write("]),") f.write("}\n") f.write(""" _lr_action = { } for _k, _v in _lr_action_items.items(): for _x,_y in zip(_v[0],_v[1]): _lr_action[(_x,_k)] = _y del _lr_action_items """) else: f.write("\n_lr_action = { "); for k,v in _lr_action.items(): f.write("(%r,%r):%r," % (k[0],k[1],v)) f.write("}\n"); if smaller: # Factor out names to try and make smaller items = { } for k,v in _lr_goto.items(): i = items.get(k[1]) if not i: i = ([],[]) items[k[1]] = i i[0].append(k[0]) i[1].append(v) f.write("\n_lr_goto_items = {") for k,v in items.items(): f.write("%r:([" % k) for i in v[0]: f.write("%r," % i) f.write("],[") for i in v[1]: f.write("%r," % i) f.write("]),") f.write("}\n") f.write(""" _lr_goto = { } for _k, _v in _lr_goto_items.items(): for _x,_y in zip(_v[0],_v[1]): _lr_goto[(_x,_k)] = _y del _lr_goto_items """) else: f.write("\n_lr_goto = { "); for k,v in _lr_goto.items(): f.write("(%r,%r):%r," % (k[0],k[1],v)) f.write("}\n"); # Write production table f.write("_lr_productions = [\n") for p in Productions: if p: if (p.func): f.write(" (%r,%d,%r,%r,%d),\n" % (p.name, p.len, p.func.__name__,p.file,p.line)) else: f.write(" (%r,%d,None,None,None),\n" % (p.name, p.len)) else: f.write(" None,\n") f.write("]\n") f.close() except IOError,e: print "Unable to create '%s'" % filename print e return def lr_read_tables(module=tab_module,optimize=0): global _lr_action, _lr_goto, _lr_productions, _lr_method try: exec "import %s as parsetab" % module if (optimize) or (Signature.digest() == parsetab._lr_signature): _lr_action = parsetab._lr_action _lr_goto = parsetab._lr_goto _lr_productions = parsetab._lr_productions _lr_method = 
parsetab._lr_method return 1 else: return 0 except (ImportError,AttributeError): return 0 # ----------------------------------------------------------------------------- # yacc(module) # # Build the parser module # ----------------------------------------------------------------------------- def yacc(method=default_lr, debug=yaccdebug, module=None, tabmodule=tab_module, start=None, check_recursion=1, optimize=0,write_tables=1,debugfile=debug_file,outputdir=''): global yaccdebug yaccdebug = debug initialize_vars() files = { } error = 0 # Add starting symbol to signature if start: Signature.update(start) # Add parsing method to signature Signature.update(method) # If a "module" parameter was supplied, extract its dictionary. # Note: a module may in fact be an instance as well. if module: # User supplied a module object. if isinstance(module, types.ModuleType): ldict = module.__dict__ elif isinstance(module, types.InstanceType): _items = [(k,getattr(module,k)) for k in dir(module)] ldict = { } for i in _items: ldict[i[0]] = i[1] else: raise ValueError,"Expected a module" else: # No module given. We might be able to get information from the caller. # Throw an exception and unwind the traceback to get the globals try: raise RuntimeError except RuntimeError: e,b,t = sys.exc_info() f = t.tb_frame f = f.f_back # Walk out to our calling function ldict = f.f_globals # Grab its globals dictionary # If running in optimized mode. We're going to if (optimize and lr_read_tables(tabmodule,1)): # Read parse table del Productions[:] for p in _lr_productions: if not p: Productions.append(None) else: m = MiniProduction() m.name = p[0] m.len = p[1] m.file = p[3] m.line = p[4] if p[2]: m.func = ldict[p[2]] Productions.append(m) else: # Get the tokens map if (module and isinstance(module,types.InstanceType)): tokens = getattr(module,"tokens",None) else: tokens = ldict.get("tokens",None) if not tokens: raise YaccError,"module does not define a list 'tokens'" if not (isinstance(tokens,types.ListType) or isinstance(tokens,types.TupleType)): raise YaccError,"tokens must be a list or tuple." # Check to see if a requires dictionary is defined. requires = ldict.get("require",None) if requires: if not (isinstance(requires,types.DictType)): raise YaccError,"require must be a dictionary." for r,v in requires.items(): try: if not (isinstance(v,types.ListType)): raise TypeError v1 = [x.split(".") for x in v] Requires[r] = v1 except StandardError: print "Invalid specification for rule '%s' in require. Expected a list of strings" % r # Build the dictionary of terminals. We a record a 0 in the # dictionary to track whether or not a terminal is actually # used in the grammar if 'error' in tokens: print "yacc: Illegal token 'error'. Is a reserved word." raise YaccError,"Illegal token name" for n in tokens: if Terminals.has_key(n): print "yacc: Warning. Token '%s' multiply defined." % n Terminals[n] = [ ] Terminals['error'] = [ ] # Get the precedence map (if any) prec = ldict.get("precedence",None) if prec: if not (isinstance(prec,types.ListType) or isinstance(prec,types.TupleType)): raise YaccError,"precedence must be a list or tuple." 
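# Added note (not in the original source): the user-level `precedence`
# declaration validated above is what ultimately drives the shift/reduce
# resolution in slr_parse_table() and lalr_parse_table().  add_precedence()
# (defined earlier in this file) turns each ('left'|'right'|'nonassoc', tok,
# ...) tuple into Precedence[tok] = (assoc, level), with entries later in the
# list binding more tightly.  A hypothetical declaration and the resulting
# entries (shape only):
#
#     precedence = (
#         ('left',  'PLUS', 'MINUS'),      # level 1
#         ('left',  'TIMES', 'DIVIDE'),    # level 2
#         ('right', 'UMINUS'),             # level 3
#     )
#     # => Precedence['TIMES'] == ('left', 2); tokens not listed default to
#     #    ('right', 0), as set in the loop that follows.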
add_precedence(prec) Signature.update(repr(prec)) for n in tokens: if not Precedence.has_key(n): Precedence[n] = ('right',0) # Default, right associative, 0 precedence # Look for error handler ef = ldict.get('p_error',None) if ef: if isinstance(ef,types.FunctionType): ismethod = 0 elif isinstance(ef, types.MethodType): ismethod = 1 else: raise YaccError,"'p_error' defined, but is not a function or method." eline = ef.func_code.co_firstlineno efile = ef.func_code.co_filename files[efile] = None if (ef.func_code.co_argcount != 1+ismethod): raise YaccError,"%s:%d: p_error() requires 1 argument." % (efile,eline) global Errorfunc Errorfunc = ef else: print "yacc: Warning. no p_error() function is defined." # Get the list of built-in functions with p_ prefix symbols = [ldict[f] for f in ldict.keys() if (type(ldict[f]) in (types.FunctionType, types.MethodType) and ldict[f].__name__[:2] == 'p_' and ldict[f].__name__ != 'p_error')] # Check for non-empty symbols if len(symbols) == 0: raise YaccError,"no rules of the form p_rulename are defined." # Sort the symbols by line number symbols.sort(lambda x,y: cmp(x.func_code.co_firstlineno,y.func_code.co_firstlineno)) # Add all of the symbols to the grammar for f in symbols: if (add_function(f)) < 0: error += 1 else: files[f.func_code.co_filename] = None # Make a signature of the docstrings for f in symbols: if f.__doc__: Signature.update(f.__doc__) lr_init_vars() if error: raise YaccError,"Unable to construct parser." if not lr_read_tables(tabmodule): # Validate files for filename in files.keys(): if not validate_file(filename): error = 1 # Validate dictionary validate_dict(ldict) if start and not Prodnames.has_key(start): raise YaccError,"Bad starting symbol '%s'" % start augment_grammar(start) error = verify_productions(cycle_check=check_recursion) otherfunc = [ldict[f] for f in ldict.keys() if (type(f) in (types.FunctionType,types.MethodType) and ldict[f].__name__[:2] != 'p_')] if error: raise YaccError,"Unable to construct parser." build_lritems() compute_first1() compute_follow(start) if method == 'SLR': slr_parse_table() elif method == 'LALR': lalr_parse_table() else: raise YaccError, "Unknown parsing method '%s'" % method if write_tables: lr_write_tables(tabmodule,outputdir) if yaccdebug: try: f = open(os.path.join(outputdir,debugfile),"w") f.write(_vfc.getvalue()) f.write("\n\n") f.write(_vf.getvalue()) f.close() except IOError,e: print "yacc: can't create '%s'" % debugfile,e # Made it here. Create a parser object and set up its internal state. # Set global parse() method to bound method of parser object. p = Parser("xyzzy") p.productions = Productions p.errorfunc = Errorfunc p.action = _lr_action p.goto = _lr_goto p.method = _lr_method p.require = Requires global parse parse = p.parse # Clean up all of the globals we created if (not optimize): yacc_cleanup() return p # yacc_cleanup function. 
Delete all of the global variables # used during table construction def yacc_cleanup(): global _lr_action, _lr_goto, _lr_method, _lr_goto_cache del _lr_action, _lr_goto, _lr_method, _lr_goto_cache global Productions, Prodnames, Prodmap, Terminals global Nonterminals, First, Follow, Precedence, LRitems global Errorfunc, Signature, Requires global Prodempty, TReductions, NTReductions, GotoSetNum, Canonical del Productions, Prodnames, Prodmap, Terminals del Nonterminals, First, Follow, Precedence, LRitems del Errorfunc, Signature, Requires del Prodempty, TReductions, NTReductions, GotoSetNum, Canonical global _vf, _vfc del _vf, _vfc # Stub that raises an error if parsing is attempted without first calling yacc() def parse(*args,**kwargs): raise YaccError, "yacc: No parser built with yacc()" ================================================ FILE: src/kenlm/COPYING ================================================ GNU GENERAL PUBLIC LICENSE Version 3, 29 June 2007 Copyright (C) 2007 Free Software Foundation, Inc. Everyone is permitted to copy and distribute verbatim copies of this license document, but changing it is not allowed. Preamble The GNU General Public License is a free, copyleft license for software and other kinds of works. The licenses for most software and other practical works are designed to take away your freedom to share and change the works. By contrast, the GNU General Public License is intended to guarantee your freedom to share and change all versions of a program--to make sure it remains free software for all its users. We, the Free Software Foundation, use the GNU General Public License for most of our software; it applies also to any other work released this way by its authors. You can apply it to your programs, too. When we speak of free software, we are referring to freedom, not price. Our General Public Licenses are designed to make sure that you have the freedom to distribute copies of free software (and charge for them if you wish), that you receive source code or can get it if you want it, that you can change the software or use pieces of it in new free programs, and that you know you can do these things. To protect your rights, we need to prevent others from denying you these rights or asking you to surrender the rights. Therefore, you have certain responsibilities if you distribute copies of the software, or if you modify it: responsibilities to respect the freedom of others. For example, if you distribute copies of such a program, whether gratis or for a fee, you must pass on to the recipients the same freedoms that you received. You must make sure that they, too, receive or can get the source code. And you must show them these terms so they know their rights. Developers that use the GNU GPL protect your rights with two steps: (1) assert copyright on the software, and (2) offer you this License giving you legal permission to copy, distribute and/or modify it. For the developers' and authors' protection, the GPL clearly explains that there is no warranty for this free software. For both users' and authors' sake, the GPL requires that modified versions be marked as changed, so that their problems will not be attributed erroneously to authors of previous versions. Some devices are designed to deny users access to install or run modified versions of the software inside them, although the manufacturer can do so. This is fundamentally incompatible with the aim of protecting users' freedom to change the software. 
The systematic pattern of such abuse occurs in the area of products for individuals to use, which is precisely where it is most unacceptable. Therefore, we have designed this version of the GPL to prohibit the practice for those products. If such problems arise substantially in other domains, we stand ready to extend this provision to those domains in future versions of the GPL, as needed to protect the freedom of users. Finally, every program is threatened constantly by software patents. States should not allow patents to restrict development and use of software on general-purpose computers, but in those that do, we wish to avoid the special danger that patents applied to a free program could make it effectively proprietary. To prevent this, the GPL assures that patents cannot be used to render the program non-free. The precise terms and conditions for copying, distribution and modification follow. TERMS AND CONDITIONS 0. Definitions. "This License" refers to version 3 of the GNU General Public License. "Copyright" also means copyright-like laws that apply to other kinds of works, such as semiconductor masks. "The Program" refers to any copyrightable work licensed under this License. Each licensee is addressed as "you". "Licensees" and "recipients" may be individuals or organizations. To "modify" a work means to copy from or adapt all or part of the work in a fashion requiring copyright permission, other than the making of an exact copy. The resulting work is called a "modified version" of the earlier work or a work "based on" the earlier work. A "covered work" means either the unmodified Program or a work based on the Program. To "propagate" a work means to do anything with it that, without permission, would make you directly or secondarily liable for infringement under applicable copyright law, except executing it on a computer or modifying a private copy. Propagation includes copying, distribution (with or without modification), making available to the public, and in some countries other activities as well. To "convey" a work means any kind of propagation that enables other parties to make or receive copies. Mere interaction with a user through a computer network, with no transfer of a copy, is not conveying. An interactive user interface displays "Appropriate Legal Notices" to the extent that it includes a convenient and prominently visible feature that (1) displays an appropriate copyright notice, and (2) tells the user that there is no warranty for the work (except to the extent that warranties are provided), that licensees may convey the work under this License, and how to view a copy of this License. If the interface presents a list of user commands or options, such as a menu, a prominent item in the list meets this criterion. 1. Source Code. The "source code" for a work means the preferred form of the work for making modifications to it. "Object code" means any non-source form of a work. A "Standard Interface" means an interface that either is an official standard defined by a recognized standards body, or, in the case of interfaces specified for a particular programming language, one that is widely used among developers working in that language. 
The "System Libraries" of an executable work include anything, other than the work as a whole, that (a) is included in the normal form of packaging a Major Component, but which is not part of that Major Component, and (b) serves only to enable use of the work with that Major Component, or to implement a Standard Interface for which an implementation is available to the public in source code form. A "Major Component", in this context, means a major essential component (kernel, window system, and so on) of the specific operating system (if any) on which the executable work runs, or a compiler used to produce the work, or an object code interpreter used to run it. The "Corresponding Source" for a work in object code form means all the source code needed to generate, install, and (for an executable work) run the object code and to modify the work, including scripts to control those activities. However, it does not include the work's System Libraries, or general-purpose tools or generally available free programs which are used unmodified in performing those activities but which are not part of the work. For example, Corresponding Source includes interface definition files associated with source files for the work, and the source code for shared libraries and dynamically linked subprograms that the work is specifically designed to require, such as by intimate data communication or control flow between those subprograms and other parts of the work. The Corresponding Source need not include anything that users can regenerate automatically from other parts of the Corresponding Source. The Corresponding Source for a work in source code form is that same work. 2. Basic Permissions. All rights granted under this License are granted for the term of copyright on the Program, and are irrevocable provided the stated conditions are met. This License explicitly affirms your unlimited permission to run the unmodified Program. The output from running a covered work is covered by this License only if the output, given its content, constitutes a covered work. This License acknowledges your rights of fair use or other equivalent, as provided by copyright law. You may make, run and propagate covered works that you do not convey, without conditions so long as your license otherwise remains in force. You may convey covered works to others for the sole purpose of having them make modifications exclusively for you, or provide you with facilities for running those works, provided that you comply with the terms of this License in conveying all material for which you do not control copyright. Those thus making or running the covered works for you must do so exclusively on your behalf, under your direction and control, on terms that prohibit them from making any copies of your copyrighted material outside their relationship with you. Conveying under any other circumstances is permitted solely under the conditions stated below. Sublicensing is not allowed; section 10 makes it unnecessary. 3. Protecting Users' Legal Rights From Anti-Circumvention Law. No covered work shall be deemed part of an effective technological measure under any applicable law fulfilling obligations under article 11 of the WIPO copyright treaty adopted on 20 December 1996, or similar laws prohibiting or restricting circumvention of such measures. 
When you convey a covered work, you waive any legal power to forbid circumvention of technological measures to the extent such circumvention is effected by exercising rights under this License with respect to the covered work, and you disclaim any intention to limit operation or modification of the work as a means of enforcing, against the work's users, your or third parties' legal rights to forbid circumvention of technological measures. 4. Conveying Verbatim Copies. You may convey verbatim copies of the Program's source code as you receive it, in any medium, provided that you conspicuously and appropriately publish on each copy an appropriate copyright notice; keep intact all notices stating that this License and any non-permissive terms added in accord with section 7 apply to the code; keep intact all notices of the absence of any warranty; and give all recipients a copy of this License along with the Program. You may charge any price or no price for each copy that you convey, and you may offer support or warranty protection for a fee. 5. Conveying Modified Source Versions. You may convey a work based on the Program, or the modifications to produce it from the Program, in the form of source code under the terms of section 4, provided that you also meet all of these conditions: a) The work must carry prominent notices stating that you modified it, and giving a relevant date. b) The work must carry prominent notices stating that it is released under this License and any conditions added under section 7. This requirement modifies the requirement in section 4 to "keep intact all notices". c) You must license the entire work, as a whole, under this License to anyone who comes into possession of a copy. This License will therefore apply, along with any applicable section 7 additional terms, to the whole of the work, and all its parts, regardless of how they are packaged. This License gives no permission to license the work in any other way, but it does not invalidate such permission if you have separately received it. d) If the work has interactive user interfaces, each must display Appropriate Legal Notices; however, if the Program has interactive interfaces that do not display Appropriate Legal Notices, your work need not make them do so. A compilation of a covered work with other separate and independent works, which are not by their nature extensions of the covered work, and which are not combined with it such as to form a larger program, in or on a volume of a storage or distribution medium, is called an "aggregate" if the compilation and its resulting copyright are not used to limit the access or legal rights of the compilation's users beyond what the individual works permit. Inclusion of a covered work in an aggregate does not cause this License to apply to the other parts of the aggregate. 6. Conveying Non-Source Forms. You may convey a covered work in object code form under the terms of sections 4 and 5, provided that you also convey the machine-readable Corresponding Source under the terms of this License, in one of these ways: a) Convey the object code in, or embodied in, a physical product (including a physical distribution medium), accompanied by the Corresponding Source fixed on a durable physical medium customarily used for software interchange. 
b) Convey the object code in, or embodied in, a physical product (including a physical distribution medium), accompanied by a written offer, valid for at least three years and valid for as long as you offer spare parts or customer support for that product model, to give anyone who possesses the object code either (1) a copy of the Corresponding Source for all the software in the product that is covered by this License, on a durable physical medium customarily used for software interchange, for a price no more than your reasonable cost of physically performing this conveying of source, or (2) access to copy the Corresponding Source from a network server at no charge. c) Convey individual copies of the object code with a copy of the written offer to provide the Corresponding Source. This alternative is allowed only occasionally and noncommercially, and only if you received the object code with such an offer, in accord with subsection 6b. d) Convey the object code by offering access from a designated place (gratis or for a charge), and offer equivalent access to the Corresponding Source in the same way through the same place at no further charge. You need not require recipients to copy the Corresponding Source along with the object code. If the place to copy the object code is a network server, the Corresponding Source may be on a different server (operated by you or a third party) that supports equivalent copying facilities, provided you maintain clear directions next to the object code saying where to find the Corresponding Source. Regardless of what server hosts the Corresponding Source, you remain obligated to ensure that it is available for as long as needed to satisfy these requirements. e) Convey the object code using peer-to-peer transmission, provided you inform other peers where the object code and Corresponding Source of the work are being offered to the general public at no charge under subsection 6d. A separable portion of the object code, whose source code is excluded from the Corresponding Source as a System Library, need not be included in conveying the object code work. A "User Product" is either (1) a "consumer product", which means any tangible personal property which is normally used for personal, family, or household purposes, or (2) anything designed or sold for incorporation into a dwelling. In determining whether a product is a consumer product, doubtful cases shall be resolved in favor of coverage. For a particular product received by a particular user, "normally used" refers to a typical or common use of that class of product, regardless of the status of the particular user or of the way in which the particular user actually uses, or expects or is expected to use, the product. A product is a consumer product regardless of whether the product has substantial commercial, industrial or non-consumer uses, unless such uses represent the only significant mode of use of the product. "Installation Information" for a User Product means any methods, procedures, authorization keys, or other information required to install and execute modified versions of a covered work in that User Product from a modified version of its Corresponding Source. The information must suffice to ensure that the continued functioning of the modified object code is in no case prevented or interfered with solely because modification has been made. 
If you convey an object code work under this section in, or with, or specifically for use in, a User Product, and the conveying occurs as part of a transaction in which the right of possession and use of the User Product is transferred to the recipient in perpetuity or for a fixed term (regardless of how the transaction is characterized), the Corresponding Source conveyed under this section must be accompanied by the Installation Information. But this requirement does not apply if neither you nor any third party retains the ability to install modified object code on the User Product (for example, the work has been installed in ROM). The requirement to provide Installation Information does not include a requirement to continue to provide support service, warranty, or updates for a work that has been modified or installed by the recipient, or for the User Product in which it has been modified or installed. Access to a network may be denied when the modification itself materially and adversely affects the operation of the network or violates the rules and protocols for communication across the network. Corresponding Source conveyed, and Installation Information provided, in accord with this section must be in a format that is publicly documented (and with an implementation available to the public in source code form), and must require no special password or key for unpacking, reading or copying. 7. Additional Terms. "Additional permissions" are terms that supplement the terms of this License by making exceptions from one or more of its conditions. Additional permissions that are applicable to the entire Program shall be treated as though they were included in this License, to the extent that they are valid under applicable law. If additional permissions apply only to part of the Program, that part may be used separately under those permissions, but the entire Program remains governed by this License without regard to the additional permissions. When you convey a copy of a covered work, you may at your option remove any additional permissions from that copy, or from any part of it. (Additional permissions may be written to require their own removal in certain cases when you modify the work.) You may place additional permissions on material, added by you to a covered work, for which you have or can give appropriate copyright permission. 
Notwithstanding any other provision of this License, for material you add to a covered work, you may (if authorized by the copyright holders of that material) supplement the terms of this License with terms: a) Disclaiming warranty or limiting liability differently from the terms of sections 15 and 16 of this License; or b) Requiring preservation of specified reasonable legal notices or author attributions in that material or in the Appropriate Legal Notices displayed by works containing it; or c) Prohibiting misrepresentation of the origin of that material, or requiring that modified versions of such material be marked in reasonable ways as different from the original version; or d) Limiting the use for publicity purposes of names of licensors or authors of the material; or e) Declining to grant rights under trademark law for use of some trade names, trademarks, or service marks; or f) Requiring indemnification of licensors and authors of that material by anyone who conveys the material (or modified versions of it) with contractual assumptions of liability to the recipient, for any liability that these contractual assumptions directly impose on those licensors and authors. All other non-permissive additional terms are considered "further restrictions" within the meaning of section 10. If the Program as you received it, or any part of it, contains a notice stating that it is governed by this License along with a term that is a further restriction, you may remove that term. If a license document contains a further restriction but permits relicensing or conveying under this License, you may add to a covered work material governed by the terms of that license document, provided that the further restriction does not survive such relicensing or conveying. If you add terms to a covered work in accord with this section, you must place, in the relevant source files, a statement of the additional terms that apply to those files, or a notice indicating where to find the applicable terms. Additional terms, permissive or non-permissive, may be stated in the form of a separately written license, or stated as exceptions; the above requirements apply either way. 8. Termination. You may not propagate or modify a covered work except as expressly provided under this License. Any attempt otherwise to propagate or modify it is void, and will automatically terminate your rights under this License (including any patent licenses granted under the third paragraph of section 11). However, if you cease all violation of this License, then your license from a particular copyright holder is reinstated (a) provisionally, unless and until the copyright holder explicitly and finally terminates your license, and (b) permanently, if the copyright holder fails to notify you of the violation by some reasonable means prior to 60 days after the cessation. Moreover, your license from a particular copyright holder is reinstated permanently if the copyright holder notifies you of the violation by some reasonable means, this is the first time you have received notice of violation of this License (for any work) from that copyright holder, and you cure the violation prior to 30 days after your receipt of the notice. Termination of your rights under this section does not terminate the licenses of parties who have received copies or rights from you under this License. If your rights have been terminated and not permanently reinstated, you do not qualify to receive new licenses for the same material under section 10. 9. 
Acceptance Not Required for Having Copies. You are not required to accept this License in order to receive or run a copy of the Program. Ancillary propagation of a covered work occurring solely as a consequence of using peer-to-peer transmission to receive a copy likewise does not require acceptance. However, nothing other than this License grants you permission to propagate or modify any covered work. These actions infringe copyright if you do not accept this License. Therefore, by modifying or propagating a covered work, you indicate your acceptance of this License to do so. 10. Automatic Licensing of Downstream Recipients. Each time you convey a covered work, the recipient automatically receives a license from the original licensors, to run, modify and propagate that work, subject to this License. You are not responsible for enforcing compliance by third parties with this License. An "entity transaction" is a transaction transferring control of an organization, or substantially all assets of one, or subdividing an organization, or merging organizations. If propagation of a covered work results from an entity transaction, each party to that transaction who receives a copy of the work also receives whatever licenses to the work the party's predecessor in interest had or could give under the previous paragraph, plus a right to possession of the Corresponding Source of the work from the predecessor in interest, if the predecessor has it or can get it with reasonable efforts. You may not impose any further restrictions on the exercise of the rights granted or affirmed under this License. For example, you may not impose a license fee, royalty, or other charge for exercise of rights granted under this License, and you may not initiate litigation (including a cross-claim or counterclaim in a lawsuit) alleging that any patent claim is infringed by making, using, selling, offering for sale, or importing the Program or any portion of it. 11. Patents. A "contributor" is a copyright holder who authorizes use under this License of the Program or a work on which the Program is based. The work thus licensed is called the contributor's "contributor version". A contributor's "essential patent claims" are all patent claims owned or controlled by the contributor, whether already acquired or hereafter acquired, that would be infringed by some manner, permitted by this License, of making, using, or selling its contributor version, but do not include claims that would be infringed only as a consequence of further modification of the contributor version. For purposes of this definition, "control" includes the right to grant patent sublicenses in a manner consistent with the requirements of this License. Each contributor grants you a non-exclusive, worldwide, royalty-free patent license under the contributor's essential patent claims, to make, use, sell, offer for sale, import and otherwise run, modify and propagate the contents of its contributor version. In the following three paragraphs, a "patent license" is any express agreement or commitment, however denominated, not to enforce a patent (such as an express permission to practice a patent or covenant not to sue for patent infringement). To "grant" such a patent license to a party means to make such an agreement or commitment not to enforce a patent against the party. 
If you convey a covered work, knowingly relying on a patent license, and the Corresponding Source of the work is not available for anyone to copy, free of charge and under the terms of this License, through a publicly available network server or other readily accessible means, then you must either (1) cause the Corresponding Source to be so available, or (2) arrange to deprive yourself of the benefit of the patent license for this particular work, or (3) arrange, in a manner consistent with the requirements of this License, to extend the patent license to downstream recipients. "Knowingly relying" means you have actual knowledge that, but for the patent license, your conveying the covered work in a country, or your recipient's use of the covered work in a country, would infringe one or more identifiable patents in that country that you have reason to believe are valid. If, pursuant to or in connection with a single transaction or arrangement, you convey, or propagate by procuring conveyance of, a covered work, and grant a patent license to some of the parties receiving the covered work authorizing them to use, propagate, modify or convey a specific copy of the covered work, then the patent license you grant is automatically extended to all recipients of the covered work and works based on it. A patent license is "discriminatory" if it does not include within the scope of its coverage, prohibits the exercise of, or is conditioned on the non-exercise of one or more of the rights that are specifically granted under this License. You may not convey a covered work if you are a party to an arrangement with a third party that is in the business of distributing software, under which you make payment to the third party based on the extent of your activity of conveying the work, and under which the third party grants, to any of the parties who would receive the covered work from you, a discriminatory patent license (a) in connection with copies of the covered work conveyed by you (or copies made from those copies), or (b) primarily for and in connection with specific products or compilations that contain the covered work, unless you entered into that arrangement, or that patent license was granted, prior to 28 March 2007. Nothing in this License shall be construed as excluding or limiting any implied license or other defenses to infringement that may otherwise be available to you under applicable patent law. 12. No Surrender of Others' Freedom. If conditions are imposed on you (whether by court order, agreement or otherwise) that contradict the conditions of this License, they do not excuse you from the conditions of this License. If you cannot convey a covered work so as to satisfy simultaneously your obligations under this License and any other pertinent obligations, then as a consequence you may not convey it at all. For example, if you agree to terms that obligate you to collect a royalty for further conveying from those to whom you convey the Program, the only way you could satisfy both those terms and this License would be to refrain entirely from conveying the Program. 13. Use with the GNU Affero General Public License. Notwithstanding any other provision of this License, you have permission to link or combine any covered work with a work licensed under version 3 of the GNU Affero General Public License into a single combined work, and to convey the resulting work. 
The terms of this License will continue to apply to the part which is the covered work, but the special requirements of the GNU Affero General Public License, section 13, concerning interaction through a network will apply to the combination as such. 14. Revised Versions of this License. The Free Software Foundation may publish revised and/or new versions of the GNU General Public License from time to time. Such new versions will be similar in spirit to the present version, but may differ in detail to address new problems or concerns. Each version is given a distinguishing version number. If the Program specifies that a certain numbered version of the GNU General Public License "or any later version" applies to it, you have the option of following the terms and conditions either of that numbered version or of any later version published by the Free Software Foundation. If the Program does not specify a version number of the GNU General Public License, you may choose any version ever published by the Free Software Foundation. If the Program specifies that a proxy can decide which future versions of the GNU General Public License can be used, that proxy's public statement of acceptance of a version permanently authorizes you to choose that version for the Program. Later license versions may give you additional or different permissions. However, no additional obligations are imposed on any author or copyright holder as a result of your choosing to follow a later version. 15. Disclaimer of Warranty. THERE IS NO WARRANTY FOR THE PROGRAM, TO THE EXTENT PERMITTED BY APPLICABLE LAW. EXCEPT WHEN OTHERWISE STATED IN WRITING THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM "AS IS" WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE. THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE OF THE PROGRAM IS WITH YOU. SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME THE COST OF ALL NECESSARY SERVICING, REPAIR OR CORRECTION. 16. Limitation of Liability. IN NO EVENT UNLESS REQUIRED BY APPLICABLE LAW OR AGREED TO IN WRITING WILL ANY COPYRIGHT HOLDER, OR ANY OTHER PARTY WHO MODIFIES AND/OR CONVEYS THE PROGRAM AS PERMITTED ABOVE, BE LIABLE TO YOU FOR DAMAGES, INCLUDING ANY GENERAL, SPECIAL, INCIDENTAL OR CONSEQUENTIAL DAMAGES ARISING OUT OF THE USE OR INABILITY TO USE THE PROGRAM (INCLUDING BUT NOT LIMITED TO LOSS OF DATA OR DATA BEING RENDERED INACCURATE OR LOSSES SUSTAINED BY YOU OR THIRD PARTIES OR A FAILURE OF THE PROGRAM TO OPERATE WITH ANY OTHER PROGRAMS), EVEN IF SUCH HOLDER OR OTHER PARTY HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH DAMAGES. 17. Interpretation of Sections 15 and 16. If the disclaimer of warranty and limitation of liability provided above cannot be given local legal effect according to their terms, reviewing courts shall apply local law that most closely approximates an absolute waiver of all civil liability in connection with the Program, unless a warranty or assumption of liability accompanies a copy of the Program in return for a fee. END OF TERMS AND CONDITIONS How to Apply These Terms to Your New Programs If you develop a new program, and you want it to be of the greatest possible use to the public, the best way to achieve this is to make it free software which everyone can redistribute and change under these terms. To do so, attach the following notices to the program. 
It is safest to attach them to the start of each source file to most effectively state the exclusion of warranty; and each file should have at least the "copyright" line and a pointer to where the full notice is found. Copyright (C) This program is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program. If not, see . Also add information on how to contact you by electronic and paper mail. If the program does terminal interaction, make it output a short notice like this when it starts in an interactive mode: Copyright (C) This program comes with ABSOLUTELY NO WARRANTY; for details type `show w'. This is free software, and you are welcome to redistribute it under certain conditions; type `show c' for details. The hypothetical commands `show w' and `show c' should show the appropriate parts of the General Public License. Of course, your program's commands might be different; for a GUI interface, you would use an "about box". You should also get your employer (if you work as a programmer) or school, if any, to sign a "copyright disclaimer" for the program, if necessary. For more information on this, and how to apply and follow the GNU GPL, see . The GNU General Public License does not permit incorporating your program into proprietary programs. If your program is a subroutine library, you may consider it more useful to permit linking proprietary applications with the library. If this is what you want to do, use the GNU Lesser General Public License instead of this License. But first, please read . ================================================ FILE: src/kenlm/COPYING.LESSER ================================================ GNU LESSER GENERAL PUBLIC LICENSE Version 3, 29 June 2007 Copyright (C) 2007 Free Software Foundation, Inc. Everyone is permitted to copy and distribute verbatim copies of this license document, but changing it is not allowed. This version of the GNU Lesser General Public License incorporates the terms and conditions of version 3 of the GNU General Public License, supplemented by the additional permissions listed below. 0. Additional Definitions. As used herein, "this License" refers to version 3 of the GNU Lesser General Public License, and the "GNU GPL" refers to version 3 of the GNU General Public License. "The Library" refers to a covered work governed by this License, other than an Application or a Combined Work as defined below. An "Application" is any work that makes use of an interface provided by the Library, but which is not otherwise based on the Library. Defining a subclass of a class defined by the Library is deemed a mode of using an interface provided by the Library. A "Combined Work" is a work produced by combining or linking an Application with the Library. The particular version of the Library with which the Combined Work was made is also called the "Linked Version". 
The "Minimal Corresponding Source" for a Combined Work means the Corresponding Source for the Combined Work, excluding any source code for portions of the Combined Work that, considered in isolation, are based on the Application, and not on the Linked Version. The "Corresponding Application Code" for a Combined Work means the object code and/or source code for the Application, including any data and utility programs needed for reproducing the Combined Work from the Application, but excluding the System Libraries of the Combined Work. 1. Exception to Section 3 of the GNU GPL. You may convey a covered work under sections 3 and 4 of this License without being bound by section 3 of the GNU GPL. 2. Conveying Modified Versions. If you modify a copy of the Library, and, in your modifications, a facility refers to a function or data to be supplied by an Application that uses the facility (other than as an argument passed when the facility is invoked), then you may convey a copy of the modified version: a) under this License, provided that you make a good faith effort to ensure that, in the event an Application does not supply the function or data, the facility still operates, and performs whatever part of its purpose remains meaningful, or b) under the GNU GPL, with none of the additional permissions of this License applicable to that copy. 3. Object Code Incorporating Material from Library Header Files. The object code form of an Application may incorporate material from a header file that is part of the Library. You may convey such object code under terms of your choice, provided that, if the incorporated material is not limited to numerical parameters, data structure layouts and accessors, or small macros, inline functions and templates (ten or fewer lines in length), you do both of the following: a) Give prominent notice with each copy of the object code that the Library is used in it and that the Library and its use are covered by this License. b) Accompany the object code with a copy of the GNU GPL and this license document. 4. Combined Works. You may convey a Combined Work under terms of your choice that, taken together, effectively do not restrict modification of the portions of the Library contained in the Combined Work and reverse engineering for debugging such modifications, if you also do each of the following: a) Give prominent notice with each copy of the Combined Work that the Library is used in it and that the Library and its use are covered by this License. b) Accompany the Combined Work with a copy of the GNU GPL and this license document. c) For a Combined Work that displays copyright notices during execution, include the copyright notice for the Library among these notices, as well as a reference directing the user to the copies of the GNU GPL and this license document. d) Do one of the following: 0) Convey the Minimal Corresponding Source under the terms of this License, and the Corresponding Application Code in a form suitable for, and under terms that permit, the user to recombine or relink the Application with a modified version of the Linked Version to produce a modified Combined Work, in the manner specified by section 6 of the GNU GPL for conveying Corresponding Source. 1) Use a suitable shared library mechanism for linking with the Library. 
A suitable mechanism is one that (a) uses at run time a copy of the Library already present on the user's computer system, and (b) will operate properly with a modified version of the Library that is interface-compatible with the Linked Version. e) Provide Installation Information, but only if you would otherwise be required to provide such information under section 6 of the GNU GPL, and only to the extent that such information is necessary to install and execute a modified version of the Combined Work produced by recombining or relinking the Application with a modified version of the Linked Version. (If you use option 4d0, the Installation Information must accompany the Minimal Corresponding Source and Corresponding Application Code. If you use option 4d1, you must provide the Installation Information in the manner specified by section 6 of the GNU GPL for conveying Corresponding Source.) 5. Combined Libraries. You may place library facilities that are a work based on the Library side by side in a single library together with other library facilities that are not Applications and are not covered by this License, and convey such a combined library under terms of your choice, if you do both of the following: a) Accompany the combined library with a copy of the same work based on the Library, uncombined with any other library facilities, conveyed under the terms of this License. b) Give prominent notice with the combined library that part of it is a work based on the Library, and explaining where to find the accompanying uncombined form of the same work. 6. Revised Versions of the GNU Lesser General Public License. The Free Software Foundation may publish revised and/or new versions of the GNU Lesser General Public License from time to time. Such new versions will be similar in spirit to the present version, but may differ in detail to address new problems or concerns. Each version is given a distinguishing version number. If the Library as you received it specifies that a certain numbered version of the GNU Lesser General Public License "or any later version" applies to it, you have the option of following the terms and conditions either of that published version or of any later version published by the Free Software Foundation. If the Library as you received it does not specify a version number of the GNU Lesser General Public License, you may choose any version of the GNU Lesser General Public License ever published by the Free Software Foundation. If the Library as you received it specifies that a proxy can decide whether future versions of the GNU Lesser General Public License shall apply, that proxy's public statement of acceptance of any version is permanent authorization for you to choose that version for the Library. ================================================ FILE: src/kenlm/LICENSE ================================================ Most of the code here is licensed under the LGPL. There are exceptions which have their own licenses, listed below. See comments in those files for more details. util/murmur_hash.cc is under the MIT license. util/string_piece.hh and util/string_piece.cc are Google code and contains its own license. For the rest: Avenue code is free software: you can redistribute it and/or modify it under the terms of the GNU Lesser General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. 
Avenue code is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for more details. You should have received a copy of the GNU Lesser General Public License along with Avenue code. If not, see . ================================================ FILE: src/kenlm/README ================================================ Language model inference code by Kenneth Heafield The official website is http://kheafield.com/code/kenlm/. If you're a decoder developer, please download the latest version from there instead of copying from another decoder. Two data structures are supported: probing and trie. Probing is a probing hash table with keys that are 64-bit hashes of n-grams and floats as values. Trie is a fairly standard trie but with bit-level packing so it uses the minimum number of bits to store word indices and pointers. The trie node entries are sorted by word index. Probing is the fastest and uses the most memory. Trie uses the least memory and is a bit slower. With trie, resident memory is 58% of IRST's smallest version and 21% of SRI's compact version. Simultaneously, the trie's CPU use is 81% of IRST's fastest version and 84% of SRI's fast version. KenLM's probing hash table implementation goes even faster at the expense of using more memory. See http://kheafield.com/code/kenlm/benchmark/. Binary format via mmap is supported. Run ./build_binary to make one, then pass the binary file name to the appropriate Model constructor. Currently, it assumes POSIX APIs for errno, strerror_r, open, close, mmap, munmap, ftruncate, fstat, lseek, and read. This is tested on Linux and the non-UNIX Mac OS X. I welcome submissions porting (via #ifdef) to other systems (e.g. Windows) but proudly have no machine on which to test it. A brief note to Mac OS X users: your gcc is too old to recognize the pack pragma. The warning effectively means that, on 64-bit machines, the model will use 16 bytes instead of 12 bytes per n-gram of maximum order (those of lower order are already 16 bytes) in the probing and sorted models. The trie is not impacted by this. FOR DEVELOPERS Copy the code and distribute with your decoder. - It does not depend on Boost or ICU. If you use ICU, define HAVE_ICU in util/have.hh (uncomment the line) to avoid a name conflict. Defining HAVE_BOOST will let you hash StringPiece. - Most people have zlib. If you don't want to depend on that, comment out #define HAVE_ZLIB in util/have.hh. This will disable loading gzipped ARPA files. - Look at compile.sh and reimplement using your build system. - Use either the interface in lm/model.hh or lm/virtual_interface.hh. Interface documentation is in comments of lm/virtual_interface.hh (including for lm/model.hh). - See lm/config.hh for tuning options. - I recommend copying the code and distributing it with your decoder. However, please send improvements to me so that they can be integrated into the package. Also included: A wrapper to SRI with the same interface. The name was Hieu Hoang's idea, not mine. ================================================ FILE: src/kenlm/build_jnilib.sh ================================================ #!/bin/bash # based on compile_query_only.sh echo Compiling source files rm {lm,util}/*.o 2>/dev/null set -e CXXFLAGS="-I.
-O3 -DNDEBUG -DKENLM_MAX_ORDER=6 -fPIC $CXXFLAGS" #Grab all cc files in these directories except those ending in test.cc or main.cc objects="" for i in util/double-conversion/*.cc util/*.cc lm/*.cc; do if [ "${i%test.cc}" == "$i" ] && [ "${i%main.cc}" == "$i" ]; then g++ $CXXFLAGS -c $i -o ${i%.cc}.o objects="$objects ${i%.cc}.o" fi done echo Compiling binaries into bin mkdir -p bin g++ $CXXFLAGS lm/build_binary_main.cc $objects -o bin/build_binary g++ $CXXFLAGS lm/query_main.cc $objects -o bin/query g++ $CXXFLAGS lm/kenlm_max_order_main.cc -o bin/kenlm_max_order echo Compiling JNI library and moving it to openccg/lib g++ $CXXFLAGS jni/wrap.cc -I $JAVA_HOME/include -I $JAVA_HOME/include/linux $objects -shared -Wl,-soname,libken.so -o libken.so -lz -Wno-deprecated -pthread mv libken.so ../../lib/. ================================================ FILE: src/kenlm/clean_query_only.sh ================================================ #!/bin/bash rm -rf {lm,util,util/double-conversion}/*.o bin/{query,kenlm_max_order,build_binary} ================================================ FILE: src/kenlm/jni/wrap.cc ================================================ #include "lm/enumerate_vocab.hh" #include "lm/model.hh" #include "util/murmur_hash.hh" #include #include #include #include #include // Grr. Everybody's compiler is slightly different and I'm trying to not depend on boost. #include // This is needed to compile on OS X Lion / gcc 4.2.1 namespace __gnu_cxx { template<> struct hash { size_t operator()(unsigned long long int __x) const { return __x; } }; } // Verify that jint and lm::ngram::WordIndex are the same size. If this breaks // for you, there's a need to revise probString. namespace { template struct StaticCheck {}; template<> struct StaticCheck { typedef bool StaticAssertionPassed; }; typedef StaticCheck::StaticAssertionPassed FloatSize; // Vocab ids above what the vocabulary knows about are unknown and should // be mapped to that. void MapArray(const std::vector& map, jint *begin, jint *end) { for (jint *i = begin; i < end; ++i) { *i = map[*i]; } } char *PieceCopy(const StringPiece &str) { char *ret = (char*) malloc(str.size() + 1); memcpy(ret, str.data(), str.size()); ret[str.size()] = 0; return ret; } // Rather than handle several different instantiations over JNI, we'll just // do virtual calls C++-side. class VirtualBase { public: virtual ~VirtualBase() { } virtual float Prob(jint *begin, jint *end) const = 0; virtual float ProbString(jint * const begin, jint * const end, jint start) const = 0; virtual uint8_t Order() const = 0; virtual bool RegisterWord(const StringPiece& word, const int wd_id) = 0; protected: VirtualBase() { } private: }; template class VirtualImpl: public VirtualBase { public: VirtualImpl(const char *name, float fake_oov_cost) : m_(name), fake_oov_cost_(fake_oov_cost) { // Insert unknown id mapping. map_.push_back(0); } ~VirtualImpl() { } float Prob(jint * const begin, jint * const end) const { MapArray(map_, begin, end); std::reverse(begin, end - 1); lm::ngram::State ignored; return *(end - 1) ? 
m_.FullScoreForgotState( reinterpret_cast(begin), reinterpret_cast(end - 1), *(end - 1), ignored).prob : fake_oov_cost_; } float ProbString(jint * const begin, jint * const end, jint start) const { MapArray(map_, begin, end); float prob; lm::ngram::State state; if (start == 0) { prob = 0; state = m_.NullContextState(); } else { std::reverse(begin, begin + start); prob = m_.FullScoreForgotState( reinterpret_cast(begin), reinterpret_cast(begin + start), begin[start], state).prob; if (begin[start] == 0) prob = fake_oov_cost_; ++start; } lm::ngram::State state2; for (const jint *i = begin + start;;) { if (i >= end) break; float got = m_.Score(state, *i, state2); prob += *(i++) ? got : fake_oov_cost_; if (i >= end) break; got = m_.Score(state2, *i, state); prob += *(i++) ? got : fake_oov_cost_; } return prob; } uint8_t Order() const { return m_.Order(); } bool RegisterWord(const StringPiece& word, const int wd_id) { if (map_.size() <= wd_id) { map_.resize(wd_id + 1, 0); } bool already_present = false; if (map_[wd_id] != 0) already_present = true; map_[wd_id] = m_.GetVocabulary().Index(word); return already_present; } private: Model m_; float fake_oov_cost_; std::vector map_; }; VirtualBase *ConstructModel(const char *file_name, float fake_oov_cost) { using namespace lm::ngram; ModelType model_type; if (!RecognizeBinary(file_name, model_type)) model_type = HASH_PROBING; switch (model_type) { case HASH_PROBING: return new VirtualImpl(file_name, fake_oov_cost); case TRIE_SORTED: return new VirtualImpl(file_name, fake_oov_cost); case ARRAY_TRIE_SORTED: return new VirtualImpl(file_name, fake_oov_cost); case QUANT_TRIE_SORTED: return new VirtualImpl(file_name, fake_oov_cost); case QUANT_ARRAY_TRIE_SORTED: return new VirtualImpl(file_name, fake_oov_cost); default: UTIL_THROW( lm::FormatLoadException, "Unrecognized file format " << (unsigned) model_type << " in file " << file_name); } } } // namespace extern "C" { JNIEXPORT jlong JNICALL Java_opennlp_ccg_ngrams_kenlm_jni_KenLM_construct( JNIEnv *env, jclass, jstring file_name, jfloat fake_oov_cost) { const char *str = env->GetStringUTFChars(file_name, 0); if (!str) return 0; jlong ret; try { ret = reinterpret_cast(ConstructModel(str, fake_oov_cost)); } catch (std::exception &e) { std::cerr << e.what() << std::endl; abort(); } env->ReleaseStringUTFChars(file_name, str); return ret; } JNIEXPORT void JNICALL Java_opennlp_ccg_ngrams_kenlm_jni_KenLM_destroy( JNIEnv *env, jclass, jlong pointer) { delete reinterpret_cast(pointer); } JNIEXPORT jint JNICALL Java_opennlp_ccg_ngrams_kenlm_jni_KenLM_order( JNIEnv *env, jclass, jlong pointer) { return reinterpret_cast(pointer)->Order(); } JNIEXPORT jboolean JNICALL Java_opennlp_ccg_ngrams_kenlm_jni_KenLM_registerWord( JNIEnv *env, jclass, jlong pointer, jstring word, jint id) { const char *str = env->GetStringUTFChars(word, 0); if (!str) return false; jint ret; try { ret = reinterpret_cast(pointer)->RegisterWord(str, id); } catch (std::exception &e) { std::cerr << e.what() << std::endl; abort(); } env->ReleaseStringUTFChars(word, str); return ret; } JNIEXPORT jfloat JNICALL Java_opennlp_ccg_ngrams_kenlm_jni_KenLM_prob( JNIEnv *env, jclass, jlong pointer, jintArray arr) { jint length = env->GetArrayLength(arr); if (length <= 0) return 0.0; // GCC only. 
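// The stack array "jint values[length]" just below is a C99-style variable-
// length array, a GCC extension in C++ (hence the "GCC only" remark above).
// A portable sketch of the same step, using only the standard library
// (std::vector from <vector>), would heap-allocate instead:
//
//   std::vector<jint> values(length);
//   env->GetIntArrayRegion(arr, 0, length, &values[0]);
//   return reinterpret_cast<const VirtualBase*>(pointer)->Prob(&values[0], &values[0] + length);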
jint values[length]; env->GetIntArrayRegion(arr, 0, length, values); return reinterpret_cast(pointer)->Prob(values, values + length); } JNIEXPORT jfloat JNICALL Java_opennlp_ccg_ngrams_kenlm_jni_KenLM_probString( JNIEnv *env, jclass, jlong pointer, jintArray arr, jint start) { jint length = env->GetArrayLength(arr); if (length <= start) return 0.0; // GCC only. jint values[length]; env->GetIntArrayRegion(arr, 0, length, values); return reinterpret_cast(pointer)->ProbString(values, values + length, start); } } // extern ================================================ FILE: src/kenlm/lm/Jamfile ================================================ # If you need higher order, change this option # Having this limit means that State can be # (KENLM_MAX_ORDER - 1) * sizeof(float) bytes instead of # sizeof(float*) + (KENLM_MAX_ORDER - 1) * sizeof(float) + malloc overhead max-order = [ option.get "max-kenlm-order" : 6 : 6 ] ; if ( $(max-order) != 6 ) { echo "Setting KenLM maximum n-gram order to $(max-order)" ; } max-order = KENLM_MAX_ORDER=$(max-order) ; path-constant ORDER-LOG : bin/order.log ; update-if-changed $(ORDER-LOG) $(max-order) ; max-order += $(ORDER-LOG) ; fakelib kenlm : [ glob *.cc : *main.cc *test.cc ] ../util//kenutil : .. $(max-order) : : .. $(max-order) ; import testing ; run left_test.cc kenlm /top//boost_unit_test_framework : : test.arpa ; run model_test.cc kenlm /top//boost_unit_test_framework : : test.arpa test_nounk.arpa ; run partial_test.cc kenlm /top//boost_unit_test_framework : : test.arpa ; exe query : query_main.cc kenlm ../util//kenutil ; exe build_binary : build_binary_main.cc kenlm ../util//kenutil ; exe fragment : fragment_main.cc kenlm ; alias programs : query build_binary fragment filter//filter : multi:builder//lmplz ; ================================================ FILE: src/kenlm/lm/bhiksha.cc ================================================ #include "lm/bhiksha.hh" #include "lm/config.hh" #include "util/file.hh" #include "util/exception.hh" #include namespace lm { namespace ngram { namespace trie { DontBhiksha::DontBhiksha(const void * /*base*/, uint64_t /*max_offset*/, uint64_t max_next, const Config &/*config*/) : next_(util::BitsMask::ByMax(max_next)) {} const uint8_t kArrayBhikshaVersion = 0; // TODO: put this in binary file header instead when I change the binary file format again. void ArrayBhiksha::UpdateConfigFromBinary(int fd, Config &config) { uint8_t version; uint8_t configured_bits; util::ReadOrThrow(fd, &version, 1); util::ReadOrThrow(fd, &configured_bits, 1); if (version != kArrayBhikshaVersion) UTIL_THROW(FormatLoadException, "This file has sorted array compression version " << (unsigned) version << " but the code expects version " << (unsigned)kArrayBhikshaVersion); config.pointer_bhiksha_bits = configured_bits; } namespace { // Find argmin_{chopped \in [0, RequiredBits(max_next)]} ChoppedDelta(max_offset) uint8_t ChopBits(uint64_t max_offset, uint64_t max_next, const Config &config) { uint8_t required = util::RequiredBits(max_next); uint8_t best_chop = 0; int64_t lowest_change = std::numeric_limits::max(); // There are probably faster ways but I don't care because this is only done once per order at construction time. 
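// A worked instance of the delta minimized by the loop below, with purely
// illustrative numbers: suppose max_next = 1,000,000 (so required = 20 bits)
// and max_offset = 10,000,000.  Chopping 8 bits costs a lookup table of
// (1,000,000 >> 12) * 64 = 244 * 64 = 15,616 bits while saving
// 10,000,000 * 8 = 80,000,000 inline bits, so the delta is strongly negative
// and chopping is a large net win here; the loop simply evaluates this delta
// for every candidate chop and keeps the smallest.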
for (uint8_t chop = 0; chop <= std::min(required, config.pointer_bhiksha_bits); ++chop) { int64_t change = (max_next >> (required - chop)) * 64 /* table cost in bits */ - max_offset * static_cast(chop); /* savings in bits*/ if (change < lowest_change) { lowest_change = change; best_chop = chop; } } return best_chop; } std::size_t ArrayCount(uint64_t max_offset, uint64_t max_next, const Config &config) { uint8_t required = util::RequiredBits(max_next); uint8_t chopping = ChopBits(max_offset, max_next, config); return (max_next >> (required - chopping)) + 1 /* we store 0 too */; } } // namespace uint64_t ArrayBhiksha::Size(uint64_t max_offset, uint64_t max_next, const Config &config) { return sizeof(uint64_t) * (1 /* header */ + ArrayCount(max_offset, max_next, config)) + 7 /* 8-byte alignment */; } uint8_t ArrayBhiksha::InlineBits(uint64_t max_offset, uint64_t max_next, const Config &config) { return util::RequiredBits(max_next) - ChopBits(max_offset, max_next, config); } namespace { void *AlignTo8(void *from) { uint8_t *val = reinterpret_cast(from); std::size_t remainder = reinterpret_cast(val) & 7; if (!remainder) return val; return val + 8 - remainder; } } // namespace ArrayBhiksha::ArrayBhiksha(void *base, uint64_t max_offset, uint64_t max_next, const Config &config) : next_inline_(util::BitsMask::ByBits(InlineBits(max_offset, max_next, config))), offset_begin_(reinterpret_cast(AlignTo8(base)) + 1 /* 8-byte header */), offset_end_(offset_begin_ + ArrayCount(max_offset, max_next, config)), write_to_(reinterpret_cast(AlignTo8(base)) + 1 /* 8-byte header */ + 1 /* first entry is 0 */), original_base_(base) {} void ArrayBhiksha::FinishedLoading(const Config &config) { // *offset_begin_ = 0 but without a const_cast. *(write_to_ - (write_to_ - offset_begin_)) = 0; if (write_to_ != offset_end_) UTIL_THROW(util::Exception, "Did not get all the array entries that were expected."); uint8_t *head_write = reinterpret_cast(original_base_); *(head_write++) = kArrayBhikshaVersion; *(head_write++) = config.pointer_bhiksha_bits; } void ArrayBhiksha::LoadedBinary() { } } // namespace trie } // namespace ngram } // namespace lm ================================================ FILE: src/kenlm/lm/bhiksha.hh ================================================ /* Simple implementation of * @inproceedings{bhikshacompression, * author={Bhiksha Raj and Ed Whittaker}, * year={2003}, * title={Lossless Compression of Language Model Structure and Word Identifiers}, * booktitle={Proceedings of IEEE International Conference on Acoustics, Speech and Signal Processing}, * pages={388--391}, * } * * Currently only used for next pointers. 
*/ #ifndef LM_BHIKSHA__ #define LM_BHIKSHA__ #include #include #include "lm/model_type.hh" #include "lm/trie.hh" #include "util/bit_packing.hh" #include "util/sorted_uniform.hh" namespace lm { namespace ngram { struct Config; namespace trie { class DontBhiksha { public: static const ModelType kModelTypeAdd = static_cast(0); static void UpdateConfigFromBinary(int /*fd*/, Config &/*config*/) {} static uint64_t Size(uint64_t /*max_offset*/, uint64_t /*max_next*/, const Config &/*config*/) { return 0; } static uint8_t InlineBits(uint64_t /*max_offset*/, uint64_t max_next, const Config &/*config*/) { return util::RequiredBits(max_next); } DontBhiksha(const void *base, uint64_t max_offset, uint64_t max_next, const Config &config); void ReadNext(const void *base, uint64_t bit_offset, uint64_t /*index*/, uint8_t total_bits, NodeRange &out) const { out.begin = util::ReadInt57(base, bit_offset, next_.bits, next_.mask); out.end = util::ReadInt57(base, bit_offset + total_bits, next_.bits, next_.mask); //assert(out.end >= out.begin); } void WriteNext(void *base, uint64_t bit_offset, uint64_t /*index*/, uint64_t value) { util::WriteInt57(base, bit_offset, next_.bits, value); } void FinishedLoading(const Config &/*config*/) {} void LoadedBinary() {} uint8_t InlineBits() const { return next_.bits; } private: util::BitsMask next_; }; class ArrayBhiksha { public: static const ModelType kModelTypeAdd = kArrayAdd; static void UpdateConfigFromBinary(int fd, Config &config); static uint64_t Size(uint64_t max_offset, uint64_t max_next, const Config &config); static uint8_t InlineBits(uint64_t max_offset, uint64_t max_next, const Config &config); ArrayBhiksha(void *base, uint64_t max_offset, uint64_t max_value, const Config &config); void ReadNext(const void *base, uint64_t bit_offset, uint64_t index, uint8_t total_bits, NodeRange &out) const { const uint64_t *begin_it = util::BinaryBelow(util::IdentityAccessor(), offset_begin_, offset_end_, index); const uint64_t *end_it; for (end_it = begin_it; (end_it < offset_end_) && (*end_it <= index + 1); ++end_it) {} --end_it; out.begin = ((begin_it - offset_begin_) << next_inline_.bits) | util::ReadInt57(base, bit_offset, next_inline_.bits, next_inline_.mask); out.end = ((end_it - offset_begin_) << next_inline_.bits) | util::ReadInt57(base, bit_offset + total_bits, next_inline_.bits, next_inline_.mask); //assert(out.end >= out.begin); } void WriteNext(void *base, uint64_t bit_offset, uint64_t index, uint64_t value) { uint64_t encode = value >> next_inline_.bits; for (; write_to_ <= offset_begin_ + encode; ++write_to_) *write_to_ = index; util::WriteInt57(base, bit_offset, next_inline_.bits, value & next_inline_.mask); } void FinishedLoading(const Config &config); void LoadedBinary(); uint8_t InlineBits() const { return next_inline_.bits; } private: const util::BitsMask next_inline_; const uint64_t *const offset_begin_; const uint64_t *const offset_end_; uint64_t *write_to_; void *original_base_; }; } // namespace trie } // namespace ngram } // namespace lm #endif // LM_BHIKSHA__ ================================================ FILE: src/kenlm/lm/binary_format.cc ================================================ #include "lm/binary_format.hh" #include "lm/lm_exception.hh" #include "util/file.hh" #include "util/file_piece.hh" #include #include #include #include #include namespace lm { namespace ngram { namespace { const char kMagicBeforeVersion[] = "mmap lm http://kheafield.com/code format version"; const char kMagicBytes[] = "mmap lm http://kheafield.com/code format 
version 5\n\0"; // This must be shorter than kMagicBytes and indicates an incomplete binary file (i.e. build failed). const char kMagicIncomplete[] = "mmap lm http://kheafield.com/code incomplete\n"; const long int kMagicVersion = 5; // Old binary files built on 32-bit machines have this header. // TODO: eliminate with next binary release. struct OldSanity { char magic[sizeof(kMagicBytes)]; float zero_f, one_f, minus_half_f; WordIndex one_word_index, max_word_index; uint64_t one_uint64; void SetToReference() { std::memset(this, 0, sizeof(OldSanity)); std::memcpy(magic, kMagicBytes, sizeof(magic)); zero_f = 0.0; one_f = 1.0; minus_half_f = -0.5; one_word_index = 1; max_word_index = std::numeric_limits::max(); one_uint64 = 1; } }; // Test values aligned to 8 bytes. struct Sanity { char magic[ALIGN8(sizeof(kMagicBytes))]; float zero_f, one_f, minus_half_f; WordIndex one_word_index, max_word_index, padding_to_8; uint64_t one_uint64; void SetToReference() { std::memset(this, 0, sizeof(Sanity)); std::memcpy(magic, kMagicBytes, sizeof(kMagicBytes)); zero_f = 0.0; one_f = 1.0; minus_half_f = -0.5; one_word_index = 1; max_word_index = std::numeric_limits::max(); padding_to_8 = 0; one_uint64 = 1; } }; const char *kModelNames[6] = {"probing hash tables", "probing hash tables with rest costs", "trie", "trie with quantization", "trie with array-compressed pointers", "trie with quantization and array-compressed pointers"}; std::size_t TotalHeaderSize(unsigned char order) { return ALIGN8(sizeof(Sanity) + sizeof(FixedWidthParameters) + sizeof(uint64_t) * order); } void WriteHeader(void *to, const Parameters ¶ms) { Sanity header = Sanity(); header.SetToReference(); std::memcpy(to, &header, sizeof(Sanity)); char *out = reinterpret_cast(to) + sizeof(Sanity); *reinterpret_cast(out) = params.fixed; out += sizeof(FixedWidthParameters); uint64_t *counts = reinterpret_cast(out); for (std::size_t i = 0; i < params.counts.size(); ++i) { counts[i] = params.counts[i]; } } } // namespace uint8_t *SetupJustVocab(const Config &config, uint8_t order, std::size_t memory_size, Backing &backing) { if (config.write_mmap) { std::size_t total = TotalHeaderSize(order) + memory_size; backing.file.reset(util::CreateOrThrow(config.write_mmap)); if (config.write_method == Config::WRITE_MMAP) { backing.vocab.reset(util::MapZeroedWrite(backing.file.get(), total), total, util::scoped_memory::MMAP_ALLOCATED); } else { util::ResizeOrThrow(backing.file.get(), 0); util::MapAnonymous(total, backing.vocab); } strncpy(reinterpret_cast(backing.vocab.get()), kMagicIncomplete, TotalHeaderSize(order)); return reinterpret_cast(backing.vocab.get()) + TotalHeaderSize(order); } else { util::MapAnonymous(memory_size, backing.vocab); return reinterpret_cast(backing.vocab.get()); } } uint8_t *GrowForSearch(const Config &config, std::size_t vocab_pad, std::size_t memory_size, Backing &backing) { std::size_t adjusted_vocab = backing.vocab.size() + vocab_pad; if (config.write_mmap) { // Grow the file to accomodate the search, using zeros. try { util::ResizeOrThrow(backing.file.get(), adjusted_vocab + memory_size); } catch (util::ErrnoException &e) { e << " for file " << config.write_mmap; throw e; } if (config.write_method == Config::WRITE_AFTER) { util::MapAnonymous(memory_size, backing.search); return reinterpret_cast(backing.search.get()); } // mmap it now. // We're skipping over the header and vocab for the search space mmap. mmap likes page aligned offsets, so some arithmetic to round the offset down. 
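// Illustration of the rounding below, with made-up numbers: given a 4096-byte
// page size and adjusted_vocab = 10,000, the cruft is 10,000 % 4096 = 1,808,
// so the mapping starts at file offset 8,192 with length 1,808 + memory_size,
// and the returned pointer is 1,808 bytes into that mapping -- i.e. exactly at
// file offset 10,000, as intended.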
std::size_t page_size = util::SizePage(); std::size_t alignment_cruft = adjusted_vocab % page_size; backing.search.reset(util::MapOrThrow(alignment_cruft + memory_size, true, util::kFileFlags, false, backing.file.get(), adjusted_vocab - alignment_cruft), alignment_cruft + memory_size, util::scoped_memory::MMAP_ALLOCATED); return reinterpret_cast(backing.search.get()) + alignment_cruft; } else { util::MapAnonymous(memory_size, backing.search); return reinterpret_cast(backing.search.get()); } } void FinishFile(const Config &config, ModelType model_type, unsigned int search_version, const std::vector &counts, std::size_t vocab_pad, Backing &backing) { if (!config.write_mmap) return; switch (config.write_method) { case Config::WRITE_MMAP: util::SyncOrThrow(backing.vocab.get(), backing.vocab.size()); util::SyncOrThrow(backing.search.get(), backing.search.size()); break; case Config::WRITE_AFTER: util::SeekOrThrow(backing.file.get(), 0); util::WriteOrThrow(backing.file.get(), backing.vocab.get(), backing.vocab.size()); util::SeekOrThrow(backing.file.get(), backing.vocab.size() + vocab_pad); util::WriteOrThrow(backing.file.get(), backing.search.get(), backing.search.size()); util::FSyncOrThrow(backing.file.get()); break; } // header and vocab share the same mmap. The header is written here because we know the counts. Parameters params = Parameters(); params.counts = counts; params.fixed.order = counts.size(); params.fixed.probing_multiplier = config.probing_multiplier; params.fixed.model_type = model_type; params.fixed.has_vocabulary = config.include_vocab; params.fixed.search_version = search_version; WriteHeader(backing.vocab.get(), params); if (config.write_method == Config::WRITE_AFTER) { util::SeekOrThrow(backing.file.get(), 0); util::WriteOrThrow(backing.file.get(), backing.vocab.get(), TotalHeaderSize(counts.size())); } } namespace detail { bool IsBinaryFormat(int fd) { const uint64_t size = util::SizeFile(fd); if (size == util::kBadSize || (size <= static_cast(sizeof(Sanity)))) return false; // Try reading the header. util::scoped_memory memory; try { util::MapRead(util::LAZY, fd, 0, sizeof(Sanity), memory); } catch (const util::Exception &e) { return false; } Sanity reference_header = Sanity(); reference_header.SetToReference(); if (!memcmp(memory.get(), &reference_header, sizeof(Sanity))) return true; if (!memcmp(memory.get(), kMagicIncomplete, strlen(kMagicIncomplete))) { UTIL_THROW(FormatLoadException, "This binary file did not finish building"); } if (!memcmp(memory.get(), kMagicBeforeVersion, strlen(kMagicBeforeVersion))) { char *end_ptr; const char *begin_version = static_cast(memory.get()) + strlen(kMagicBeforeVersion); long int version = strtol(begin_version, &end_ptr, 10); if ((end_ptr != begin_version) && version != kMagicVersion) { UTIL_THROW(FormatLoadException, "Binary file has version " << version << " but this implementation expects version " << kMagicVersion << " so you'll have to use the ARPA to rebuild your binary"); } OldSanity old_sanity = OldSanity(); old_sanity.SetToReference(); UTIL_THROW_IF(!memcmp(memory.get(), &old_sanity, sizeof(OldSanity)), FormatLoadException, "Looks like this is an old 32-bit format. The old 32-bit format has been removed so that 64-bit and 32-bit files are exchangeable."); UTIL_THROW(FormatLoadException, "File looks like it should be loaded with mmap, but the test values don't match. 
Try rebuilding the binary format LM using the same code revision, compiler, and architecture"); } return false; } void ReadHeader(int fd, Parameters &out) { util::SeekOrThrow(fd, sizeof(Sanity)); util::ReadOrThrow(fd, &out.fixed, sizeof(out.fixed)); if (out.fixed.probing_multiplier < 1.0) UTIL_THROW(FormatLoadException, "Binary format claims to have a probing multiplier of " << out.fixed.probing_multiplier << " which is < 1.0."); out.counts.resize(static_cast(out.fixed.order)); if (out.fixed.order) util::ReadOrThrow(fd, &*out.counts.begin(), sizeof(uint64_t) * out.fixed.order); } void MatchCheck(ModelType model_type, unsigned int search_version, const Parameters ¶ms) { if (params.fixed.model_type != model_type) { if (static_cast(params.fixed.model_type) >= (sizeof(kModelNames) / sizeof(const char *))) UTIL_THROW(FormatLoadException, "The binary file claims to be model type " << static_cast(params.fixed.model_type) << " but this is not implemented for in this inference code."); UTIL_THROW(FormatLoadException, "The binary file was built for " << kModelNames[params.fixed.model_type] << " but the inference code is trying to load " << kModelNames[model_type]); } UTIL_THROW_IF(search_version != params.fixed.search_version, FormatLoadException, "The binary file has " << kModelNames[params.fixed.model_type] << " version " << params.fixed.search_version << " but this code expects " << kModelNames[params.fixed.model_type] << " version " << search_version); } void SeekPastHeader(int fd, const Parameters ¶ms) { util::SeekOrThrow(fd, TotalHeaderSize(params.counts.size())); } uint8_t *SetupBinary(const Config &config, const Parameters ¶ms, uint64_t memory_size, Backing &backing) { const uint64_t file_size = util::SizeFile(backing.file.get()); // The header is smaller than a page, so we have to map the whole header as well. std::size_t total_map = util::CheckOverflow(TotalHeaderSize(params.counts.size()) + memory_size); if (file_size != util::kBadSize && static_cast(file_size) < total_map) UTIL_THROW(FormatLoadException, "Binary file has size " << file_size << " but the headers say it should be at least " << total_map); util::MapRead(config.load_method, backing.file.get(), 0, total_map, backing.search); if (config.enumerate_vocab && !params.fixed.has_vocabulary) UTIL_THROW(FormatLoadException, "The decoder requested all the vocabulary strings, but this binary file does not have them. You may need to rebuild the binary file with an updated version of build_binary."); // Seek to vocabulary words util::SeekOrThrow(backing.file.get(), total_map); return reinterpret_cast(backing.search.get()) + TotalHeaderSize(params.counts.size()); } void ComplainAboutARPA(const Config &config, ModelType model_type) { if (config.write_mmap || !config.messages) return; if (config.arpa_complain == Config::ALL) { *config.messages << "Loading the LM will be faster if you build a binary file." << std::endl; } else if (config.arpa_complain == Config::EXPENSIVE && (model_type == TRIE || model_type == QUANT_TRIE || model_type == ARRAY_TRIE || model_type == QUANT_ARRAY_TRIE)) { *config.messages << "Building " << kModelNames[model_type] << " from ARPA is expensive. Save time by building a binary format." 
<< std::endl; } } } // namespace detail bool RecognizeBinary(const char *file, ModelType &recognized) { util::scoped_fd fd(util::OpenReadOrThrow(file)); if (!detail::IsBinaryFormat(fd.get())) return false; Parameters params; detail::ReadHeader(fd.get(), params); recognized = params.fixed.model_type; return true; } } // namespace ngram } // namespace lm ================================================ FILE: src/kenlm/lm/binary_format.hh ================================================ #ifndef LM_BINARY_FORMAT__ #define LM_BINARY_FORMAT__ #include "lm/config.hh" #include "lm/model_type.hh" #include "lm/read_arpa.hh" #include "util/file_piece.hh" #include "util/mmap.hh" #include "util/scoped.hh" #include #include #include namespace lm { namespace ngram { /*Inspect a file to determine if it is a binary lm. If not, return false. * If so, return true and set recognized to the type. This is the only API in * this header designed for use by decoder authors. */ bool RecognizeBinary(const char *file, ModelType &recognized); struct FixedWidthParameters { unsigned char order; float probing_multiplier; // What type of model is this? ModelType model_type; // Does the end of the file have the actual strings in the vocabulary? bool has_vocabulary; unsigned int search_version; }; // This is a macro instead of an inline function so constants can be assigned using it. #define ALIGN8(a) ((std::ptrdiff_t(((a)-1)/8)+1)*8) // Parameters stored in the header of a binary file. struct Parameters { FixedWidthParameters fixed; std::vector counts; }; struct Backing { // File behind memory, if any. util::scoped_fd file; // Vocabulary lookup table. Not to be confused with the vocab words themselves. util::scoped_memory vocab; // Raw block of memory backing the language model data structures util::scoped_memory search; }; // Create just enough of a binary file to write vocabulary to it. uint8_t *SetupJustVocab(const Config &config, uint8_t order, std::size_t memory_size, Backing &backing); // Grow the binary file for the search data structure and set backing.search, returning the memory address where the search data structure should begin. uint8_t *GrowForSearch(const Config &config, std::size_t vocab_pad, std::size_t memory_size, Backing &backing); // Write header to binary file. This is done last to prevent incomplete files // from loading. void FinishFile(const Config &config, ModelType model_type, unsigned int search_version, const std::vector &counts, std::size_t vocab_pad, Backing &backing); namespace detail { bool IsBinaryFormat(int fd); void ReadHeader(int fd, Parameters ¶ms); void MatchCheck(ModelType model_type, unsigned int search_version, const Parameters ¶ms); void SeekPastHeader(int fd, const Parameters ¶ms); uint8_t *SetupBinary(const Config &config, const Parameters ¶ms, uint64_t memory_size, Backing &backing); void ComplainAboutARPA(const Config &config, ModelType model_type); } // namespace detail template void LoadLM(const char *file, const Config &config, To &to) { Backing &backing = to.MutableBacking(); backing.file.reset(util::OpenReadOrThrow(file)); try { if (detail::IsBinaryFormat(backing.file.get())) { Parameters params; detail::ReadHeader(backing.file.get(), params); detail::MatchCheck(To::kModelType, To::kVersion, params); // Replace the run-time configured probing_multiplier with the one in the file. 
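// How a decoder typically reaches this code path (a sketch only; the file
// name is hypothetical, TrieModel and the single-argument constructor come
// from lm/model.hh):
//
//   lm::ngram::ModelType type;
//   bool is_binary = lm::ngram::RecognizeBinary("wsj.lm", type);
//   lm::ngram::TrieModel model("wsj.lm"); // the constructor calls LoadLM(),
//                                         // which takes either the binary or
//                                         // the ARPA branch seen here.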
Config new_config(config); new_config.probing_multiplier = params.fixed.probing_multiplier; detail::SeekPastHeader(backing.file.get(), params); To::UpdateConfigFromBinary(backing.file.get(), params.counts, new_config); uint64_t memory_size = To::Size(params.counts, new_config); uint8_t *start = detail::SetupBinary(new_config, params, memory_size, backing); to.InitializeFromBinary(start, params, new_config, backing.file.get()); } else { detail::ComplainAboutARPA(config, To::kModelType); to.InitializeFromARPA(file, config); } } catch (util::Exception &e) { e << " File: " << file; throw; } } } // namespace ngram } // namespace lm #endif // LM_BINARY_FORMAT__ ================================================ FILE: src/kenlm/lm/blank.hh ================================================ #ifndef LM_BLANK__ #define LM_BLANK__ #include #include #include namespace lm { namespace ngram { /* Suppose "foo bar" appears with zero backoff but there is no trigram * beginning with these words. Then, when scoring "foo bar", the model could * return out_state containing "bar" or even null context if "bar" also has no * backoff and is never followed by another word. Then the backoff is set to * kNoExtensionBackoff. If the n-gram might be extended, then out_state must * contain the full n-gram, in which case kExtensionBackoff is set. In any * case, if an n-gram has non-zero backoff, the full state is returned so * backoff can be properly charged. * These differ only in sign bit because the backoff is in fact zero in either * case. */ const float kNoExtensionBackoff = -0.0; const float kExtensionBackoff = 0.0; const uint64_t kNoExtensionQuant = 0; const uint64_t kExtensionQuant = 1; inline void SetExtension(float &backoff) { if (backoff == kNoExtensionBackoff) backoff = kExtensionBackoff; } // This compiles down nicely. inline bool HasExtension(const float &backoff) { typedef union { float f; uint32_t i; } UnionValue; UnionValue compare, interpret; compare.f = kNoExtensionBackoff; interpret.f = backoff; return compare.i != interpret.i; } } // namespace ngram } // namespace lm #endif // LM_BLANK__ ================================================ FILE: src/kenlm/lm/build_binary_main.cc ================================================ #include "lm/model.hh" #include "lm/sizes.hh" #include "util/file_piece.hh" #include "util/usage.hh" #include #include #include #include #include #include #include #include #ifdef WIN32 #include "util/getopt.hh" #else #include #endif namespace lm { namespace ngram { namespace { void Usage(const char *name, const char *default_mem) { std::cerr << "Usage: " << name << " [-u log10_unknown_probability] [-s] [-i] [-w mmap|after] [-p probing_multiplier] [-T trie_temporary] [-S trie_building_mem] [-q bits] [-b bits] [-a bits] [type] input.arpa [output.mmap]\n\n" "-u sets the log10 probability for if the ARPA file does not have one.\n" " Default is -100. The ARPA file will always take precedence.\n" "-s allows models to be built even if they do not have and .\n" "-i allows buggy models from IRSTLM by mapping positive log probability to 0.\n" "-w mmap|after determines how writing is done.\n" " mmap maps the binary file and writes to it. Default for trie.\n" " after allocates anonymous memory, builds, and writes. Default for probing.\n" "-r \"order1.arpa order2 order3 order4\" adds lower-order rest costs from these\n" " model files. order1.arpa must be an ARPA file. All others may be ARPA or\n" " the same data structure as being built. All files must have the same\n" " vocabulary. 
For probing, the unigrams must be in the same order.\n\n" "type is either probing or trie. Default is probing.\n\n" "probing uses a probing hash table. It is the fastest but uses the most memory.\n" "-p sets the space multiplier and must be >1.0. The default is 1.5.\n\n" "trie is a straightforward trie with bit-level packing. It uses the least\n" "memory and is still faster than SRI or IRST. Building the trie format uses an\n" "on-disk sort to save memory.\n" "-T is the temporary directory prefix. Default is the output file name.\n" "-S determines memory use for sorting. Default is " << default_mem << ". This is compatible\n" " with GNU sort. The number is followed by a unit: \% for percent of physical\n" " memory, b for bytes, K for Kilobytes, M for megabytes, then G,T,P,E,Z,Y. \n" " Default unit is K for Kilobytes.\n" "-q turns quantization on and sets the number of bits (e.g. -q 8).\n" "-b sets backoff quantization bits. Requires -q and defaults to that value.\n" "-a compresses pointers using an array of offsets. The parameter is the\n" " maximum number of bits encoded by the array. Memory is minimized subject\n" " to the maximum, so pick 255 to minimize memory.\n\n" "Get a memory estimate by passing an ARPA file without an output file name.\n"; exit(1); } // I could really use boost::lexical_cast right about now. float ParseFloat(const char *from) { char *end; float ret = strtod(from, &end); if (*end) throw util::ParseNumberException(from); return ret; } unsigned long int ParseUInt(const char *from) { char *end; unsigned long int ret = strtoul(from, &end, 10); if (*end) throw util::ParseNumberException(from); return ret; } uint8_t ParseBitCount(const char *from) { unsigned long val = ParseUInt(from); if (val > 25) { util::ParseNumberException e(from); e << " bit counts are limited to 25."; } return val; } void ParseFileList(const char *from, std::vector &to) { to.clear(); while (true) { const char *i; for (i = from; *i && *i != ' '; ++i) {} to.push_back(std::string(from, i - from)); if (!*i) break; from = i + 1; } } void ProbingQuantizationUnsupported() { std::cerr << "Quantization is only implemented in the trie data structure." << std::endl; exit(1); } } // namespace ngram } // namespace lm } // namespace int main(int argc, char *argv[]) { using namespace lm::ngram; const char *default_mem = util::GuessPhysicalMemory() ? 
"80%" : "1G"; try { bool quantize = false, set_backoff_bits = false, bhiksha = false, set_write_method = false, rest = false; lm::ngram::Config config; config.building_memory = util::ParseSize(default_mem); int opt; while ((opt = getopt(argc, argv, "q:b:a:u:p:t:T:m:S:w:sir:")) != -1) { switch(opt) { case 'q': config.prob_bits = ParseBitCount(optarg); if (!set_backoff_bits) config.backoff_bits = config.prob_bits; quantize = true; break; case 'b': config.backoff_bits = ParseBitCount(optarg); set_backoff_bits = true; break; case 'a': config.pointer_bhiksha_bits = ParseBitCount(optarg); bhiksha = true; break; case 'u': config.unknown_missing_logprob = ParseFloat(optarg); break; case 'p': config.probing_multiplier = ParseFloat(optarg); break; case 't': // legacy case 'T': config.temporary_directory_prefix = optarg; break; case 'm': // legacy config.building_memory = ParseUInt(optarg) * 1048576; break; case 'S': config.building_memory = std::min(static_cast(std::numeric_limits::max()), util::ParseSize(optarg)); break; case 'w': set_write_method = true; if (!strcmp(optarg, "mmap")) { config.write_method = Config::WRITE_MMAP; } else if (!strcmp(optarg, "after")) { config.write_method = Config::WRITE_AFTER; } else { Usage(argv[0], default_mem); } break; case 's': config.sentence_marker_missing = lm::SILENT; break; case 'i': config.positive_log_probability = lm::SILENT; break; case 'r': rest = true; ParseFileList(optarg, config.rest_lower_files); config.rest_function = Config::REST_LOWER; break; default: Usage(argv[0], default_mem); } } if (!quantize && set_backoff_bits) { std::cerr << "You specified backoff quantization (-b) but not probability quantization (-q)" << std::endl; abort(); } if (optind + 1 == argc) { ShowSizes(argv[optind], config); return 0; } const char *model_type; const char *from_file; if (optind + 2 == argc) { model_type = "probing"; from_file = argv[optind]; config.write_mmap = argv[optind + 1]; } else if (optind + 3 == argc) { model_type = argv[optind]; from_file = argv[optind + 1]; config.write_mmap = argv[optind + 2]; } else { Usage(argv[0], default_mem); } if (!strcmp(model_type, "probing")) { if (!set_write_method) config.write_method = Config::WRITE_AFTER; if (quantize || set_backoff_bits) ProbingQuantizationUnsupported(); if (rest) { RestProbingModel(from_file, config); } else { ProbingModel(from_file, config); } } else if (!strcmp(model_type, "trie")) { if (rest) { std::cerr << "Rest + trie is not supported yet." 
<< std::endl; return 1; } if (!set_write_method) config.write_method = Config::WRITE_MMAP; if (quantize) { if (bhiksha) { QuantArrayTrieModel(from_file, config); } else { QuantTrieModel(from_file, config); } } else { if (bhiksha) { ArrayTrieModel(from_file, config); } else { TrieModel(from_file, config); } } } else { Usage(argv[0], default_mem); } } catch (const std::exception &e) { std::cerr << e.what() << std::endl; std::cerr << "ERROR" << std::endl; return 1; } std::cerr << "SUCCESS" << std::endl; return 0; } ================================================ FILE: src/kenlm/lm/config.cc ================================================ #include "lm/config.hh" #include namespace lm { namespace ngram { Config::Config() : show_progress(true), messages(&std::cerr), enumerate_vocab(NULL), unknown_missing(COMPLAIN), sentence_marker_missing(THROW_UP), positive_log_probability(THROW_UP), unknown_missing_logprob(-100.0), probing_multiplier(1.5), building_memory(1073741824ULL), // 1 GB temporary_directory_prefix(NULL), arpa_complain(ALL), write_mmap(NULL), write_method(WRITE_AFTER), include_vocab(true), rest_function(REST_MAX), prob_bits(8), backoff_bits(8), pointer_bhiksha_bits(22), load_method(util::POPULATE_OR_READ) {} } // namespace ngram } // namespace lm ================================================ FILE: src/kenlm/lm/config.hh ================================================ #ifndef LM_CONFIG__ #define LM_CONFIG__ #include "lm/lm_exception.hh" #include "util/mmap.hh" #include #include #include /* Configuration for ngram model. Separate header to reduce pollution. */ namespace lm { class EnumerateVocab; namespace ngram { struct Config { // EFFECTIVE FOR BOTH ARPA AND BINARY READS // (default true) print progress bar to messages bool show_progress; // Where to log messages including the progress bar. Set to NULL for // silence. std::ostream *messages; std::ostream *ProgressMessages() const { return show_progress ? messages : 0; } // This will be called with every string in the vocabulary. See // enumerate_vocab.hh for more detail. Config does not take ownership; you // are still responsible for deleting it (or stack allocating). EnumerateVocab *enumerate_vocab; // ONLY EFFECTIVE WHEN READING ARPA // What to do when isn't in the provided model. WarningAction unknown_missing; // What to do when or is missing from the model. // If THROW_UP, the exception will be of type util::SpecialWordMissingException. WarningAction sentence_marker_missing; // What to do with a positive log probability. For COMPLAIN and SILENT, map // to 0. WarningAction positive_log_probability; // The probability to substitute for if it's missing from the model. // No effect if the model has or unknown_missing == THROW_UP. float unknown_missing_logprob; // Size multiplier for probing hash table. Must be > 1. Space is linear in // this. Time is probing_multiplier / (probing_multiplier - 1). No effect // for sorted variant. // If you find yourself setting this to a low number, consider using the // TrieModel which has lower memory consumption. float probing_multiplier; // Amount of memory to use for building. The actual memory usage will be // higher since this just sets sort buffer size. Only applies to trie // models. std::size_t building_memory; // Template for temporary directory appropriate for passing to mkdtemp. // The characters XXXXXX are appended before passing to mkdtemp. Only // applies to trie. If NULL, defaults to write_mmap. If that's NULL, // defaults to input file name. 
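// Illustrative use of the options documented in this struct (file names are
// hypothetical; QuantTrieModel is the typedef from lm/model.hh):
//
//   lm::ngram::Config cfg;
//   cfg.write_mmap = "model.binary";               // also emit a binary file
//   cfg.write_method = lm::ngram::Config::WRITE_MMAP;
//   cfg.prob_bits = cfg.backoff_bits = 8;          // quantization (trie only)
//   lm::ngram::QuantTrieModel model("model.arpa", cfg);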
const char *temporary_directory_prefix; // Level of complaining to do when loading from ARPA instead of binary format. enum ARPALoadComplain {ALL, EXPENSIVE, NONE}; ARPALoadComplain arpa_complain; // While loading an ARPA file, also write out this binary format file. Set // to NULL to disable. const char *write_mmap; enum WriteMethod { WRITE_MMAP, // Map the file directly. WRITE_AFTER // Write after we're done. }; WriteMethod write_method; // Include the vocab in the binary file? Only effective if write_mmap != NULL. bool include_vocab; // Left rest options. Only used when the model includes rest costs. enum RestFunction { REST_MAX, // Maximum of any score to the left REST_LOWER, // Use lower-order files given below. }; RestFunction rest_function; // Only used for REST_LOWER. std::vector rest_lower_files; // Quantization options. Only effective for QuantTrieModel. One value is // reserved for each of prob and backoff, so 2^bits - 1 buckets will be used // to quantize (and one of the remaining backoffs will be 0). uint8_t prob_bits, backoff_bits; // Bhiksha compression (simple form). Only works with trie. uint8_t pointer_bhiksha_bits; // ONLY EFFECTIVE WHEN READING BINARY // How to get the giant array into memory: lazy mmap, populate, read etc. // See util/mmap.hh for details of MapMethod. util::LoadMethod load_method; // Set defaults. Config(); }; } /* namespace ngram */ } /* namespace lm */ #endif // LM_CONFIG__ ================================================ FILE: src/kenlm/lm/enumerate_vocab.hh ================================================ #ifndef LM_ENUMERATE_VOCAB__ #define LM_ENUMERATE_VOCAB__ #include "lm/word_index.hh" #include "util/string_piece.hh" namespace lm { /* If you need the actual strings in the vocabulary, inherit from this class * and implement Add. Then put a pointer in Config.enumerate_vocab; it does * not take ownership. Add is called once per vocab word. index starts at 0 * and increases by 1 each time. This is only used by the Model constructor; * the pointer is not retained by the class. */ class EnumerateVocab { public: virtual ~EnumerateVocab() {} virtual void Add(WordIndex index, const StringPiece &str) = 0; protected: EnumerateVocab() {} }; } // namespace lm #endif // LM_ENUMERATE_VOCAB__ ================================================ FILE: src/kenlm/lm/facade.hh ================================================ #ifndef LM_FACADE__ #define LM_FACADE__ #include "lm/virtual_interface.hh" #include "util/string_piece.hh" #include namespace lm { namespace base { // Common model interface that depends on knowing the specific classes. // Curiously recurring template pattern. template class ModelFacade : public Model { public: typedef StateT State; typedef VocabularyT Vocabulary; // Default Score function calls FullScore. Model can override this. 
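// A minimal query sketch against this facade (the file name and words are
// hypothetical; ProbingModel is a concrete model type from lm/model.hh):
//
//   lm::ngram::ProbingModel model("lm.binary");
//   lm::ngram::State state(model.BeginSentenceState()), out;
//   float total = 0.0;                      // summed log10 probability
//   const char *words[] = {"the", "dog", "barked"};
//   for (int i = 0; i < 3; ++i) {
//     total += model.Score(state, model.GetVocabulary().Index(words[i]), out);
//     state = out;
//   }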
float Score(const State &in_state, const WordIndex new_word, State &out_state) const { return static_cast(this)->FullScore(in_state, new_word, out_state).prob; } /* Translate from void* to State */ FullScoreReturn FullScore(const void *in_state, const WordIndex new_word, void *out_state) const { return static_cast(this)->FullScore( *reinterpret_cast(in_state), new_word, *reinterpret_cast(out_state)); } float Score(const void *in_state, const WordIndex new_word, void *out_state) const { return static_cast(this)->Score( *reinterpret_cast(in_state), new_word, *reinterpret_cast(out_state)); } const State &BeginSentenceState() const { return begin_sentence_; } const State &NullContextState() const { return null_context_; } const Vocabulary &GetVocabulary() const { return *static_cast(&BaseVocabulary()); } protected: ModelFacade() : Model(sizeof(State)) {} virtual ~ModelFacade() {} // begin_sentence and null_context can disappear after. vocab should stay. void Init(const State &begin_sentence, const State &null_context, const Vocabulary &vocab, unsigned char order) { begin_sentence_ = begin_sentence; null_context_ = null_context; begin_sentence_memory_ = &begin_sentence_; null_context_memory_ = &null_context_; base_vocab_ = &vocab; order_ = order; } private: State begin_sentence_, null_context_; }; } // mamespace base } // namespace lm #endif // LM_FACADE__ ================================================ FILE: src/kenlm/lm/fragment_main.cc ================================================ #include "lm/binary_format.hh" #include "lm/model.hh" #include "lm/left.hh" #include "util/tokenize_piece.hh" template void Query(const char *name) { Model model(name); std::string line; lm::ngram::ChartState ignored; while (getline(std::cin, line)) { lm::ngram::RuleScore scorer(model, ignored); for (util::TokenIter i(line, ' '); i; ++i) { scorer.Terminal(model.GetVocabulary().Index(*i)); } std::cout << scorer.Finish() << '\n'; } } int main(int argc, char *argv[]) { if (argc != 2) { std::cerr << "Expected model file name." << std::endl; return 1; } const char *name = argv[1]; lm::ngram::ModelType model_type = lm::ngram::PROBING; lm::ngram::RecognizeBinary(name, model_type); switch (model_type) { case lm::ngram::PROBING: Query(name); break; case lm::ngram::REST_PROBING: Query(name); break; default: std::cerr << "Model type not supported yet." << std::endl; } } ================================================ FILE: src/kenlm/lm/kenlm_max_order_main.cc ================================================ #include "lm/max_order.hh" #include int main(int argc, char *argv[]) { std::cerr << "KenLM was compiled with a maximum supported n-gram order set to " << KENLM_MAX_ORDER << "." << std::endl; } ================================================ FILE: src/kenlm/lm/left.hh ================================================ /* Efficient left and right language model state for sentence fragments. * Intended usage: * Store ChartState with every chart entry. * To do a rule application: * 1. Make a ChartState object for your new entry. * 2. Construct RuleScore. * 3. Going from left to right, call Terminal or NonTerminal. * For terminals, just pass the vocab id. * For non-terminals, pass that non-terminal's ChartState. * If your decoder expects scores inclusive of subtree scores (i.e. you * label entries with the highest-scoring path), pass the non-terminal's * score as prob. * If your decoder expects relative scores and will walk the chart later, * pass prob = 0.0. 
* In other words, the only effect of prob is that it gets added to the * returned log probability. * 4. Call Finish. It returns the log probability. * * There's a couple more details: * Do not pass to Terminal as it is formally not a word in the sentence, * only context. Instead, call BeginSentence. If called, it should be the * first call after RuleScore is constructed (since is always the * leftmost). * * If the leftmost RHS is a non-terminal, it's faster to call BeginNonTerminal. * * Hashing and sorting comparison operators are provided. All state objects * are POD. If you intend to use memcmp on raw state objects, you must call * ZeroRemaining first, as the value of array entries beyond length is * otherwise undefined. * * Usage is of course not limited to chart decoding. Anything that generates * sentence fragments missing left context could benefit. For example, a * phrase-based decoder could pre-score phrases, storing ChartState with each * phrase, even if hypotheses are generated left-to-right. */ #ifndef LM_LEFT__ #define LM_LEFT__ #include "lm/max_order.hh" #include "lm/state.hh" #include "lm/return.hh" #include "util/murmur_hash.hh" #include namespace lm { namespace ngram { template class RuleScore { public: explicit RuleScore(const M &model, ChartState &out) : model_(model), out_(&out), left_done_(false), prob_(0.0) { out.left.length = 0; out.right.length = 0; } void BeginSentence() { out_->right = model_.BeginSentenceState(); // out_->left is empty. left_done_ = true; } void Terminal(WordIndex word) { State copy(out_->right); FullScoreReturn ret(model_.FullScore(copy, word, out_->right)); if (left_done_) { prob_ += ret.prob; return; } if (ret.independent_left) { prob_ += ret.prob; left_done_ = true; return; } out_->left.pointers[out_->left.length++] = ret.extend_left; prob_ += ret.rest; if (out_->right.length != copy.length + 1) left_done_ = true; } // Faster version of NonTerminal for the case where the rule begins with a non-terminal. void BeginNonTerminal(const ChartState &in, float prob = 0.0) { prob_ = prob; *out_ = in; left_done_ = in.left.full; } void NonTerminal(const ChartState &in, float prob = 0.0) { prob_ += prob; if (!in.left.length) { if (in.left.full) { for (const float *i = out_->right.backoff; i < out_->right.backoff + out_->right.length; ++i) prob_ += *i; left_done_ = true; out_->right = in.right; } return; } if (!out_->right.length) { out_->right = in.right; if (left_done_) { prob_ += model_.UnRest(in.left.pointers, in.left.pointers + in.left.length, 1); return; } if (out_->left.length) { left_done_ = true; } else { out_->left = in.left; left_done_ = in.left.full; } return; } float backoffs[KENLM_MAX_ORDER - 1], backoffs2[KENLM_MAX_ORDER - 1]; float *back = backoffs, *back2 = backoffs2; unsigned char next_use = out_->right.length; // First word if (ExtendLeft(in, next_use, 1, out_->right.backoff, back)) return; // Words after the first, so extending a bigram to begin with for (unsigned char extend_length = 2; extend_length <= in.left.length; ++extend_length) { if (ExtendLeft(in, next_use, extend_length, back, back2)) return; std::swap(back, back2); } if (in.left.full) { for (const float *i = back; i != back + next_use; ++i) prob_ += *i; left_done_ = true; out_->right = in.right; return; } // Right state was minimized, so it's already independent of the new words to the left. if (in.right.length < in.left.length) { out_->right = in.right; return; } // Shift exisiting words down. 
for (WordIndex *i = out_->right.words + next_use - 1; i >= out_->right.words; --i) { *(i + in.right.length) = *i; } // Add words from in.right. std::copy(in.right.words, in.right.words + in.right.length, out_->right.words); // Assemble backoff composed on the existing state's backoff followed by the new state's backoff. std::copy(in.right.backoff, in.right.backoff + in.right.length, out_->right.backoff); std::copy(back, back + next_use, out_->right.backoff + in.right.length); out_->right.length = in.right.length + next_use; } float Finish() { // A N-1-gram might extend left and right but we should still set full to true because it's an N-1-gram. out_->left.full = left_done_ || (out_->left.length == model_.Order() - 1); return prob_; } void Reset() { prob_ = 0.0; left_done_ = false; out_->left.length = 0; out_->right.length = 0; } void Reset(ChartState &replacement) { out_ = &replacement; Reset(); } private: bool ExtendLeft(const ChartState &in, unsigned char &next_use, unsigned char extend_length, const float *back_in, float *back_out) { ProcessRet(model_.ExtendLeft( out_->right.words, out_->right.words + next_use, // Words to extend into back_in, // Backoffs to use in.left.pointers[extend_length - 1], extend_length, // Words to be extended back_out, // Backoffs for the next score next_use)); // Length of n-gram to use in next scoring. if (next_use != out_->right.length) { left_done_ = true; if (!next_use) { // Early exit. out_->right = in.right; prob_ += model_.UnRest(in.left.pointers + extend_length, in.left.pointers + in.left.length, extend_length + 1); return true; } } // Continue scoring. return false; } void ProcessRet(const FullScoreReturn &ret) { if (left_done_) { prob_ += ret.prob; return; } if (ret.independent_left) { prob_ += ret.prob; left_done_ = true; return; } out_->left.pointers[out_->left.length++] = ret.extend_left; prob_ += ret.rest; } const M &model_; ChartState *out_; bool left_done_; float prob_; }; } // namespace ngram } // namespace lm #endif // LM_LEFT__ ================================================ FILE: src/kenlm/lm/left_test.cc ================================================ #include "lm/left.hh" #include "lm/model.hh" #include "util/tokenize_piece.hh" #include #define BOOST_TEST_MODULE LeftTest #include #include namespace lm { namespace ngram { namespace { #define Term(word) score.Terminal(m.GetVocabulary().Index(word)); #define VCheck(word, value) BOOST_CHECK_EQUAL(m.GetVocabulary().Index(word), value); // Apparently some Boost versions use templates and are pretty strict about types matching. 
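// Illustrative sketch (not part of the KenLM sources): the usage protocol
// described at the top of left.hh, applied to two small fragments.  The
// function name and word choices are hypothetical; the words happen to occur
// in the test data exercised by left_test.cc below.

#include "lm/left.hh"
#include "lm/model.hh"

inline float ScoreLittleMoreLoin(const lm::ngram::ProbingModel &model) {
  // 1. Score the fragment "more loin" with no left context yet.
  lm::ngram::ChartState more_loin;
  lm::ngram::RuleScore<lm::ngram::ProbingModel> inner(model, more_loin);
  inner.Terminal(model.GetVocabulary().Index("more"));
  inner.Terminal(model.GetVocabulary().Index("loin"));
  float inner_score = inner.Finish();

  // 2. Build "little" + [more loin]; passing the subtree score as prob makes
  //    the value returned by Finish inclusive of the inner fragment.
  lm::ngram::ChartState outer;
  lm::ngram::RuleScore<lm::ngram::ProbingModel> rule(model, outer);
  rule.Terminal(model.GetVocabulary().Index("little"));
  rule.NonTerminal(more_loin, inner_score);
  return rule.Finish();
}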
#define SLOPPY_CHECK_CLOSE(ref, value, tol) BOOST_CHECK_CLOSE(static_cast(ref), static_cast(value), static_cast(tol)); template void Short(const M &m) { ChartState base; { RuleScore score(m, base); Term("more"); Term("loin"); SLOPPY_CHECK_CLOSE(-1.206319 - 0.3561665, score.Finish(), 0.001); } BOOST_CHECK(base.left.full); BOOST_CHECK_EQUAL(2, base.left.length); BOOST_CHECK_EQUAL(1, base.right.length); VCheck("loin", base.right.words[0]); ChartState more_left; { RuleScore score(m, more_left); Term("little"); score.NonTerminal(base, -1.206319 - 0.3561665); // p(little more loin | null context) SLOPPY_CHECK_CLOSE(-1.56538, score.Finish(), 0.001); } BOOST_CHECK_EQUAL(3, more_left.left.length); BOOST_CHECK_EQUAL(1, more_left.right.length); VCheck("loin", more_left.right.words[0]); BOOST_CHECK(more_left.left.full); ChartState shorter; { RuleScore score(m, shorter); Term("to"); score.NonTerminal(base, -1.206319 - 0.3561665); SLOPPY_CHECK_CLOSE(-0.30103 - 1.687872 - 1.206319 - 0.3561665, score.Finish(), 0.01); } BOOST_CHECK_EQUAL(1, shorter.left.length); BOOST_CHECK_EQUAL(1, shorter.right.length); VCheck("loin", shorter.right.words[0]); BOOST_CHECK(shorter.left.full); } template void Charge(const M &m) { ChartState base; { RuleScore score(m, base); Term("on"); Term("more"); SLOPPY_CHECK_CLOSE(-1.509559 -0.4771212 -1.206319, score.Finish(), 0.001); } BOOST_CHECK_EQUAL(1, base.left.length); BOOST_CHECK_EQUAL(1, base.right.length); VCheck("more", base.right.words[0]); BOOST_CHECK(base.left.full); ChartState extend; { RuleScore score(m, extend); Term("looking"); score.NonTerminal(base, -1.509559 -0.4771212 -1.206319); SLOPPY_CHECK_CLOSE(-3.91039, score.Finish(), 0.001); } BOOST_CHECK_EQUAL(2, extend.left.length); BOOST_CHECK_EQUAL(1, extend.right.length); VCheck("more", extend.right.words[0]); BOOST_CHECK(extend.left.full); ChartState tobos; { RuleScore score(m, tobos); score.BeginSentence(); score.NonTerminal(extend, -3.91039); SLOPPY_CHECK_CLOSE(-3.471169, score.Finish(), 0.001); } BOOST_CHECK_EQUAL(0, tobos.left.length); BOOST_CHECK_EQUAL(1, tobos.right.length); } template float LeftToRight(const M &m, const std::vector &words, bool begin_sentence = false) { float ret = 0.0; State right = begin_sentence ? 
m.BeginSentenceState() : m.NullContextState(); for (std::vector::const_iterator i = words.begin(); i != words.end(); ++i) { State copy(right); ret += m.Score(copy, *i, right); } return ret; } template float RightToLeft(const M &m, const std::vector &words, bool begin_sentence = false) { float ret = 0.0; ChartState state; state.left.length = 0; state.right.length = 0; state.left.full = false; for (std::vector::const_reverse_iterator i = words.rbegin(); i != words.rend(); ++i) { ChartState copy(state); RuleScore score(m, state); score.Terminal(*i); score.NonTerminal(copy, ret); ret = score.Finish(); } if (begin_sentence) { ChartState copy(state); RuleScore score(m, state); score.BeginSentence(); score.NonTerminal(copy, ret); ret = score.Finish(); } return ret; } template float TreeMiddle(const M &m, const std::vector &words, bool begin_sentence = false) { std::vector > states(words.size()); for (unsigned int i = 0; i < words.size(); ++i) { RuleScore score(m, states[i].first); score.Terminal(words[i]); states[i].second = score.Finish(); } while (states.size() > 1) { std::vector > upper((states.size() + 1) / 2); for (unsigned int i = 0; i < states.size() / 2; ++i) { RuleScore score(m, upper[i].first); score.NonTerminal(states[i*2].first, states[i*2].second); score.NonTerminal(states[i*2+1].first, states[i*2+1].second); upper[i].second = score.Finish(); } if (states.size() % 2) { upper.back() = states.back(); } std::swap(states, upper); } if (states.empty()) return 0.0; if (begin_sentence) { ChartState ignored; RuleScore score(m, ignored); score.BeginSentence(); score.NonTerminal(states.front().first, states.front().second); return score.Finish(); } else { return states.front().second; } } template void LookupVocab(const M &m, const StringPiece &str, std::vector &out) { out.clear(); for (util::TokenIter i(str, ' '); i; ++i) { out.push_back(m.GetVocabulary().Index(*i)); } } #define TEXT_TEST(str) \ LookupVocab(m, str, words); \ expect = LeftToRight(m, words, rest); \ SLOPPY_CHECK_CLOSE(expect, RightToLeft(m, words, rest), 0.001); \ SLOPPY_CHECK_CLOSE(expect, TreeMiddle(m, words, rest), 0.001); \ // Build sentences, or parts thereof, from right to left. template void GrowBig(const M &m, bool rest = false) { std::vector words; float expect; TEXT_TEST("in biarritz watching considering looking . on a little more loin also would consider higher to look good unknown the screening foo bar , unknown however unknown "); TEXT_TEST("on a little more loin also would consider higher to look good unknown the screening foo bar , unknown however unknown "); TEXT_TEST("on a little more loin also would consider higher to look good"); TEXT_TEST("more loin also would consider higher to look good"); TEXT_TEST("more loin also would consider higher to look"); TEXT_TEST("also would consider higher to look"); TEXT_TEST("also would consider higher"); TEXT_TEST("would consider higher to look"); TEXT_TEST("consider higher to look"); TEXT_TEST("consider higher to"); TEXT_TEST("consider higher"); } template void GrowSmall(const M &m, bool rest = false) { std::vector words; float expect; TEXT_TEST("in biarritz watching considering looking . 
"); TEXT_TEST("in biarritz watching considering looking ."); TEXT_TEST("in biarritz"); } template void AlsoWouldConsiderHigher(const M &m) { ChartState also; { RuleScore score(m, also); score.Terminal(m.GetVocabulary().Index("also")); SLOPPY_CHECK_CLOSE(-1.687872, score.Finish(), 0.001); } ChartState would; { RuleScore score(m, would); score.Terminal(m.GetVocabulary().Index("would")); SLOPPY_CHECK_CLOSE(-1.687872, score.Finish(), 0.001); } ChartState combine_also_would; { RuleScore score(m, combine_also_would); score.NonTerminal(also, -1.687872); score.NonTerminal(would, -1.687872); SLOPPY_CHECK_CLOSE(-1.687872 - 2.0, score.Finish(), 0.001); } BOOST_CHECK_EQUAL(2, combine_also_would.right.length); ChartState also_would; { RuleScore score(m, also_would); score.Terminal(m.GetVocabulary().Index("also")); score.Terminal(m.GetVocabulary().Index("would")); SLOPPY_CHECK_CLOSE(-1.687872 - 2.0, score.Finish(), 0.001); } BOOST_CHECK_EQUAL(2, also_would.right.length); ChartState consider; { RuleScore score(m, consider); score.Terminal(m.GetVocabulary().Index("consider")); SLOPPY_CHECK_CLOSE(-1.687872, score.Finish(), 0.001); } BOOST_CHECK_EQUAL(1, consider.left.length); BOOST_CHECK_EQUAL(1, consider.right.length); BOOST_CHECK(!consider.left.full); ChartState higher; float higher_score; { RuleScore score(m, higher); score.Terminal(m.GetVocabulary().Index("higher")); higher_score = score.Finish(); } SLOPPY_CHECK_CLOSE(-1.509559, higher_score, 0.001); BOOST_CHECK_EQUAL(1, higher.left.length); BOOST_CHECK_EQUAL(1, higher.right.length); BOOST_CHECK(!higher.left.full); VCheck("higher", higher.right.words[0]); SLOPPY_CHECK_CLOSE(-0.30103, higher.right.backoff[0], 0.001); ChartState consider_higher; { RuleScore score(m, consider_higher); score.NonTerminal(consider, -1.687872); score.NonTerminal(higher, higher_score); SLOPPY_CHECK_CLOSE(-1.509559 - 1.687872 - 0.30103, score.Finish(), 0.001); } BOOST_CHECK_EQUAL(2, consider_higher.left.length); BOOST_CHECK(!consider_higher.left.full); ChartState full; { RuleScore score(m, full); score.NonTerminal(combine_also_would, -1.687872 - 2.0); score.NonTerminal(consider_higher, -1.509559 - 1.687872 - 0.30103); SLOPPY_CHECK_CLOSE(-10.6879, score.Finish(), 0.001); } BOOST_CHECK_EQUAL(4, full.right.length); } #define CHECK_SCORE(str, val) \ { \ float got = val; \ std::vector indices; \ LookupVocab(m, str, indices); \ SLOPPY_CHECK_CLOSE(LeftToRight(m, indices), got, 0.001); \ } template void FullGrow(const M &m) { std::vector words; LookupVocab(m, "in biarritz watching considering looking . 
", words); ChartState lexical[7]; float lexical_scores[7]; for (unsigned int i = 0; i < 7; ++i) { RuleScore score(m, lexical[i]); score.Terminal(words[i]); lexical_scores[i] = score.Finish(); } CHECK_SCORE("in", lexical_scores[0]); CHECK_SCORE("biarritz", lexical_scores[1]); CHECK_SCORE("watching", lexical_scores[2]); CHECK_SCORE("", lexical_scores[6]); ChartState l1[4]; float l1_scores[4]; { RuleScore score(m, l1[0]); score.NonTerminal(lexical[0], lexical_scores[0]); score.NonTerminal(lexical[1], lexical_scores[1]); CHECK_SCORE("in biarritz", l1_scores[0] = score.Finish()); } { RuleScore score(m, l1[1]); score.NonTerminal(lexical[2], lexical_scores[2]); score.NonTerminal(lexical[3], lexical_scores[3]); CHECK_SCORE("watching considering", l1_scores[1] = score.Finish()); } { RuleScore score(m, l1[2]); score.NonTerminal(lexical[4], lexical_scores[4]); score.NonTerminal(lexical[5], lexical_scores[5]); CHECK_SCORE("looking .", l1_scores[2] = score.Finish()); } BOOST_CHECK_EQUAL(l1[2].left.length, 1); l1[3] = lexical[6]; l1_scores[3] = lexical_scores[6]; ChartState l2[2]; float l2_scores[2]; { RuleScore score(m, l2[0]); score.NonTerminal(l1[0], l1_scores[0]); score.NonTerminal(l1[1], l1_scores[1]); CHECK_SCORE("in biarritz watching considering", l2_scores[0] = score.Finish()); } { RuleScore score(m, l2[1]); score.NonTerminal(l1[2], l1_scores[2]); score.NonTerminal(l1[3], l1_scores[3]); CHECK_SCORE("looking . ", l2_scores[1] = score.Finish()); } BOOST_CHECK_EQUAL(l2[1].left.length, 1); BOOST_CHECK(l2[1].left.full); ChartState top; { RuleScore score(m, top); score.NonTerminal(l2[0], l2_scores[0]); score.NonTerminal(l2[1], l2_scores[1]); CHECK_SCORE("in biarritz watching considering looking . ", score.Finish()); } } const char *FileLocation() { if (boost::unit_test::framework::master_test_suite().argc < 2) { return "test.arpa"; } return boost::unit_test::framework::master_test_suite().argv[1]; } template void Everything() { Config config; config.messages = NULL; M m(FileLocation(), config); Short(m); Charge(m); GrowBig(m); AlsoWouldConsiderHigher(m); GrowSmall(m); FullGrow(m); } BOOST_AUTO_TEST_CASE(ProbingAll) { Everything(); } BOOST_AUTO_TEST_CASE(TrieAll) { Everything(); } BOOST_AUTO_TEST_CASE(QuantTrieAll) { Everything(); } BOOST_AUTO_TEST_CASE(ArrayQuantTrieAll) { Everything(); } BOOST_AUTO_TEST_CASE(ArrayTrieAll) { Everything(); } BOOST_AUTO_TEST_CASE(RestProbing) { Config config; config.messages = NULL; RestProbingModel m(FileLocation(), config); GrowBig(m, true); } } // namespace } // namespace ngram } // namespace lm ================================================ FILE: src/kenlm/lm/lm_exception.cc ================================================ #include "lm/lm_exception.hh" #include #include namespace lm { ConfigException::ConfigException() throw() {} ConfigException::~ConfigException() throw() {} LoadException::LoadException() throw() {} LoadException::~LoadException() throw() {} FormatLoadException::FormatLoadException() throw() {} FormatLoadException::~FormatLoadException() throw() {} VocabLoadException::VocabLoadException() throw() {} VocabLoadException::~VocabLoadException() throw() {} SpecialWordMissingException::SpecialWordMissingException() throw() {} SpecialWordMissingException::~SpecialWordMissingException() throw() {} } // namespace lm ================================================ FILE: src/kenlm/lm/lm_exception.hh ================================================ #ifndef LM_LM_EXCEPTION__ #define LM_LM_EXCEPTION__ // Named to avoid conflict with util/exception.hh. 
#include "util/exception.hh" #include "util/string_piece.hh" #include #include namespace lm { typedef enum {THROW_UP, COMPLAIN, SILENT} WarningAction; class ConfigException : public util::Exception { public: ConfigException() throw(); ~ConfigException() throw(); }; class LoadException : public util::Exception { public: virtual ~LoadException() throw(); protected: LoadException() throw(); }; class FormatLoadException : public LoadException { public: FormatLoadException() throw(); ~FormatLoadException() throw(); }; class VocabLoadException : public LoadException { public: virtual ~VocabLoadException() throw(); VocabLoadException() throw(); }; class SpecialWordMissingException : public VocabLoadException { public: explicit SpecialWordMissingException() throw(); ~SpecialWordMissingException() throw(); }; } // namespace lm #endif // LM_LM_EXCEPTION ================================================ FILE: src/kenlm/lm/max_order.hh ================================================ /* IF YOUR BUILD SYSTEM PASSES -DKENLM_MAX_ORDER, THEN CHANGE THE BUILD SYSTEM. * If not, this is the default maximum order. * Having this limit means that State can be * (kMaxOrder - 1) * sizeof(float) bytes instead of * sizeof(float*) + (kMaxOrder - 1) * sizeof(float) + malloc overhead */ #ifndef KENLM_ORDER_MESSAGE #define KENLM_ORDER_MESSAGE "If your build system supports changing KENLM_MAX_ORDER, change it there and recompile. In the KenLM tarball or Moses, use e.g. `bjam --max-kenlm-order=6 -a'. Otherwise, edit lm/max_order.hh." #endif ================================================ FILE: src/kenlm/lm/model.cc ================================================ #include "lm/model.hh" #include "lm/blank.hh" #include "lm/lm_exception.hh" #include "lm/search_hashed.hh" #include "lm/search_trie.hh" #include "lm/read_arpa.hh" #include "util/have.hh" #include "util/murmur_hash.hh" #include #include #include #include #include namespace lm { namespace ngram { namespace detail { template const ModelType GenericModel::kModelType = Search::kModelType; template uint64_t GenericModel::Size(const std::vector &counts, const Config &config) { return VocabularyT::Size(counts[0], config) + Search::Size(counts, config); } template void GenericModel::SetupMemory(void *base, const std::vector &counts, const Config &config) { size_t goal_size = util::CheckOverflow(Size(counts, config)); uint8_t *start = static_cast(base); size_t allocated = VocabularyT::Size(counts[0], config); vocab_.SetupMemory(start, allocated, counts[0], config); start += allocated; start = search_.SetupMemory(start, counts, config); if (static_cast(start - static_cast(base)) != goal_size) UTIL_THROW(FormatLoadException, "The data structures took " << (start - static_cast(base)) << " but Size says they should take " << goal_size); } template GenericModel::GenericModel(const char *file, const Config &config) { LoadLM(file, config, *this); // g++ prints warnings unless these are fully initialized. 
State begin_sentence = State(); begin_sentence.length = 1; begin_sentence.words[0] = vocab_.BeginSentence(); typename Search::Node ignored_node; bool ignored_independent_left; uint64_t ignored_extend_left; begin_sentence.backoff[0] = search_.LookupUnigram(begin_sentence.words[0], ignored_node, ignored_independent_left, ignored_extend_left).Backoff(); State null_context = State(); null_context.length = 0; P::Init(begin_sentence, null_context, vocab_, search_.Order()); } namespace { void CheckCounts(const std::vector &counts) { UTIL_THROW_IF(counts.size() > KENLM_MAX_ORDER, FormatLoadException, "This model has order " << counts.size() << " but KenLM was compiled to support up to " << KENLM_MAX_ORDER << ". " << KENLM_ORDER_MESSAGE); if (sizeof(uint64_t) > sizeof(std::size_t)) { for (std::vector::const_iterator i = counts.begin(); i != counts.end(); ++i) { UTIL_THROW_IF(*i > static_cast(std::numeric_limits::max()), util::OverflowException, "This model has " << *i << " " << (i - counts.begin() + 1) << "-grams which is too many for 32-bit machines."); } } } } // namespace template void GenericModel::InitializeFromBinary(void *start, const Parameters ¶ms, const Config &config, int fd) { CheckCounts(params.counts); SetupMemory(start, params.counts, config); vocab_.LoadedBinary(params.fixed.has_vocabulary, fd, config.enumerate_vocab); search_.LoadedBinary(); } template void GenericModel::InitializeFromARPA(const char *file, const Config &config) { // Backing file is the ARPA. Steal it so we can make the backing file the mmap output if any. util::FilePiece f(backing_.file.release(), file, config.ProgressMessages()); try { std::vector counts; // File counts do not include pruned trigrams that extend to quadgrams etc. These will be fixed by search_. ReadARPACounts(f, counts); CheckCounts(counts); if (counts.size() < 2) UTIL_THROW(FormatLoadException, "This ngram implementation assumes at least a bigram model."); if (config.probing_multiplier <= 1.0) UTIL_THROW(ConfigException, "probing multiplier must be > 1.0"); std::size_t vocab_size = util::CheckOverflow(VocabularyT::Size(counts[0], config)); // Setup the binary file for writing the vocab lookup table. The search_ is responsible for growing the binary file to its needs. vocab_.SetupMemory(SetupJustVocab(config, counts.size(), vocab_size, backing_), vocab_size, counts[0], config); if (config.write_mmap) { WriteWordsWrapper wrap(config.enumerate_vocab); vocab_.ConfigureEnumerate(&wrap, counts[0]); search_.InitializeFromARPA(file, f, counts, config, vocab_, backing_); wrap.Write(backing_.file.get(), backing_.vocab.size() + vocab_.UnkCountChangePadding() + Search::Size(counts, config)); } else { vocab_.ConfigureEnumerate(config.enumerate_vocab, counts[0]); search_.InitializeFromARPA(file, f, counts, config, vocab_, backing_); } if (!vocab_.SawUnk()) { assert(config.unknown_missing != THROW_UP); // Default probabilities for unknown. 
search_.UnknownUnigram().backoff = 0.0; search_.UnknownUnigram().prob = config.unknown_missing_logprob; } FinishFile(config, kModelType, kVersion, counts, vocab_.UnkCountChangePadding(), backing_); } catch (util::Exception &e) { e << " Byte: " << f.Offset(); throw; } } template void GenericModel::UpdateConfigFromBinary(int fd, const std::vector &counts, Config &config) { util::AdvanceOrThrow(fd, VocabularyT::Size(counts[0], config)); Search::UpdateConfigFromBinary(fd, counts, config); } template FullScoreReturn GenericModel::FullScore(const State &in_state, const WordIndex new_word, State &out_state) const { FullScoreReturn ret = ScoreExceptBackoff(in_state.words, in_state.words + in_state.length, new_word, out_state); for (const float *i = in_state.backoff + ret.ngram_length - 1; i < in_state.backoff + in_state.length; ++i) { ret.prob += *i; } return ret; } template FullScoreReturn GenericModel::FullScoreForgotState(const WordIndex *context_rbegin, const WordIndex *context_rend, const WordIndex new_word, State &out_state) const { context_rend = std::min(context_rend, context_rbegin + P::Order() - 1); FullScoreReturn ret = ScoreExceptBackoff(context_rbegin, context_rend, new_word, out_state); // Add the backoff weights for n-grams of order start to (context_rend - context_rbegin). unsigned char start = ret.ngram_length; if (context_rend - context_rbegin < static_cast(start)) return ret; bool independent_left; uint64_t extend_left; typename Search::Node node; if (start <= 1) { ret.prob += search_.LookupUnigram(*context_rbegin, node, independent_left, extend_left).Backoff(); start = 2; } else if (!search_.FastMakeNode(context_rbegin, context_rbegin + start - 1, node)) { return ret; } // i is the order of the backoff we're looking for. unsigned char order_minus_2 = start - 2; for (const WordIndex *i = context_rbegin + start - 1; i < context_rend; ++i, ++order_minus_2) { typename Search::MiddlePointer p(search_.LookupMiddle(order_minus_2, *i, node, independent_left, extend_left)); if (!p.Found()) break; ret.prob += p.Backoff(); } return ret; } template void GenericModel::GetState(const WordIndex *context_rbegin, const WordIndex *context_rend, State &out_state) const { // Generate a state from context. context_rend = std::min(context_rend, context_rbegin + P::Order() - 1); if (context_rend == context_rbegin) { out_state.length = 0; return; } typename Search::Node node; bool independent_left; uint64_t extend_left; out_state.backoff[0] = search_.LookupUnigram(*context_rbegin, node, independent_left, extend_left).Backoff(); out_state.length = HasExtension(out_state.backoff[0]) ? 
1 : 0; float *backoff_out = out_state.backoff + 1; unsigned char order_minus_2 = 0; for (const WordIndex *i = context_rbegin + 1; i < context_rend; ++i, ++backoff_out, ++order_minus_2) { typename Search::MiddlePointer p(search_.LookupMiddle(order_minus_2, *i, node, independent_left, extend_left)); if (!p.Found()) { std::copy(context_rbegin, context_rbegin + out_state.length, out_state.words); return; } *backoff_out = p.Backoff(); if (HasExtension(*backoff_out)) out_state.length = i - context_rbegin + 1; } std::copy(context_rbegin, context_rbegin + out_state.length, out_state.words); } template FullScoreReturn GenericModel::ExtendLeft( const WordIndex *add_rbegin, const WordIndex *add_rend, const float *backoff_in, uint64_t extend_pointer, unsigned char extend_length, float *backoff_out, unsigned char &next_use) const { FullScoreReturn ret; typename Search::Node node; if (extend_length == 1) { typename Search::UnigramPointer ptr(search_.LookupUnigram(static_cast(extend_pointer), node, ret.independent_left, ret.extend_left)); ret.rest = ptr.Rest(); ret.prob = ptr.Prob(); assert(!ret.independent_left); } else { typename Search::MiddlePointer ptr(search_.Unpack(extend_pointer, extend_length, node)); ret.rest = ptr.Rest(); ret.prob = ptr.Prob(); ret.extend_left = extend_pointer; // If this function is called, then it does depend on left words. ret.independent_left = false; } float subtract_me = ret.rest; ret.ngram_length = extend_length; next_use = extend_length; ResumeScore(add_rbegin, add_rend, extend_length - 1, node, backoff_out, next_use, ret); next_use -= extend_length; // Charge backoffs. for (const float *b = backoff_in + ret.ngram_length - extend_length; b < backoff_in + (add_rend - add_rbegin); ++b) ret.prob += *b; ret.prob -= subtract_me; ret.rest -= subtract_me; return ret; } namespace { // Do a paraonoid copy of history, assuming new_word has already been copied // (hence the -1). out_state.length could be zero so I avoided using // std::copy. void CopyRemainingHistory(const WordIndex *from, State &out_state) { WordIndex *out = out_state.words + 1; const WordIndex *in_end = from + static_cast(out_state.length) - 1; for (const WordIndex *in = from; in < in_end; ++in, ++out) *out = *in; } } // namespace /* Ugly optimized function. Produce a score excluding backoff. * The search goes in increasing order of ngram length. * Context goes backward, so context_begin is the word immediately preceeding * new_word. */ template FullScoreReturn GenericModel::ScoreExceptBackoff( const WordIndex *const context_rbegin, const WordIndex *const context_rend, const WordIndex new_word, State &out_state) const { assert(new_word < vocab_.Bound()); FullScoreReturn ret; // ret.ngram_length contains the last known non-blank ngram length. ret.ngram_length = 1; typename Search::Node node; typename Search::UnigramPointer uni(search_.LookupUnigram(new_word, node, ret.independent_left, ret.extend_left)); out_state.backoff[0] = uni.Backoff(); ret.prob = uni.Prob(); ret.rest = uni.Rest(); // This is the length of the context that should be used for continuation to the right. out_state.length = HasExtension(out_state.backoff[0]) ? 1 : 0; // We'll write the word anyway since it will probably be used and does no harm being there. 
out_state.words[0] = new_word; if (context_rbegin == context_rend) return ret; ResumeScore(context_rbegin, context_rend, 0, node, out_state.backoff + 1, out_state.length, ret); CopyRemainingHistory(context_rbegin, out_state); return ret; } template void GenericModel::ResumeScore(const WordIndex *hist_iter, const WordIndex *const context_rend, unsigned char order_minus_2, typename Search::Node &node, float *backoff_out, unsigned char &next_use, FullScoreReturn &ret) const { for (; ; ++order_minus_2, ++hist_iter, ++backoff_out) { if (hist_iter == context_rend) return; if (ret.independent_left) return; if (order_minus_2 == P::Order() - 2) break; typename Search::MiddlePointer pointer(search_.LookupMiddle(order_minus_2, *hist_iter, node, ret.independent_left, ret.extend_left)); if (!pointer.Found()) return; *backoff_out = pointer.Backoff(); ret.prob = pointer.Prob(); ret.rest = pointer.Rest(); ret.ngram_length = order_minus_2 + 2; if (HasExtension(*backoff_out)) { next_use = ret.ngram_length; } } ret.independent_left = true; typename Search::LongestPointer longest(search_.LookupLongest(*hist_iter, node)); if (longest.Found()) { ret.prob = longest.Prob(); ret.rest = ret.prob; // There is no blank in longest_. ret.ngram_length = P::Order(); } } template float GenericModel::InternalUnRest(const uint64_t *pointers_begin, const uint64_t *pointers_end, unsigned char first_length) const { float ret; typename Search::Node node; if (first_length == 1) { if (pointers_begin >= pointers_end) return 0.0; bool independent_left; uint64_t extend_left; typename Search::UnigramPointer ptr(search_.LookupUnigram(static_cast(*pointers_begin), node, independent_left, extend_left)); ret = ptr.Prob() - ptr.Rest(); ++first_length; ++pointers_begin; } else { ret = 0.0; } for (const uint64_t *i = pointers_begin; i < pointers_end; ++i, ++first_length) { typename Search::MiddlePointer ptr(search_.Unpack(*i, first_length, node)); ret += ptr.Prob() - ptr.Rest(); } return ret; } template class GenericModel, ProbingVocabulary>; template class GenericModel, ProbingVocabulary>; template class GenericModel, SortedVocabulary>; template class GenericModel, SortedVocabulary>; template class GenericModel, SortedVocabulary>; template class GenericModel, SortedVocabulary>; } // namespace detail } // namespace ngram } // namespace lm ================================================ FILE: src/kenlm/lm/model.hh ================================================ #ifndef LM_MODEL__ #define LM_MODEL__ #include "lm/bhiksha.hh" #include "lm/binary_format.hh" #include "lm/config.hh" #include "lm/facade.hh" #include "lm/quantize.hh" #include "lm/search_hashed.hh" #include "lm/search_trie.hh" #include "lm/state.hh" #include "lm/value.hh" #include "lm/vocab.hh" #include "lm/weights.hh" #include "util/murmur_hash.hh" #include #include #include namespace util { class FilePiece; } namespace lm { namespace ngram { namespace detail { // Should return the same results as SRI. // ModelFacade typedefs Vocabulary so we use VocabularyT to avoid naming conflicts. template class GenericModel : public base::ModelFacade, State, VocabularyT> { private: typedef base::ModelFacade, State, VocabularyT> P; public: // This is the model type returned by RecognizeBinary. static const ModelType kModelType; static const unsigned int kVersion = Search::kVersion; /* Get the size of memory that will be mapped given ngram counts. This * does not include small non-mapped control structures, such as this class * itself. 
*/ static uint64_t Size(const std::vector &counts, const Config &config = Config()); /* Load the model from a file. It may be an ARPA or binary file. Binary * files must have the format expected by this class or you'll get an * exception. So TrieModel can only load ARPA or binary created by * TrieModel. To classify binary files, call RecognizeBinary in * lm/binary_format.hh. */ explicit GenericModel(const char *file, const Config &config = Config()); /* Score p(new_word | in_state) and incorporate new_word into out_state. * Note that in_state and out_state must be different references: * &in_state != &out_state. */ FullScoreReturn FullScore(const State &in_state, const WordIndex new_word, State &out_state) const; /* Slower call without in_state. Try to remember state, but sometimes it * would cost too much memory or your decoder isn't setup properly. * To use this function, make an array of WordIndex containing the context * vocabulary ids in reverse order. Then, pass the bounds of the array: * [context_rbegin, context_rend). The new_word is not part of the context * array unless you intend to repeat words. */ FullScoreReturn FullScoreForgotState(const WordIndex *context_rbegin, const WordIndex *context_rend, const WordIndex new_word, State &out_state) const; /* Get the state for a context. Don't use this if you can avoid it. Use * BeginSentenceState or EmptyContextState and extend from those. If * you're only going to use this state to call FullScore once, use * FullScoreForgotState. * To use this function, make an array of WordIndex containing the context * vocabulary ids in reverse order. Then, pass the bounds of the array: * [context_rbegin, context_rend). */ void GetState(const WordIndex *context_rbegin, const WordIndex *context_rend, State &out_state) const; /* More efficient version of FullScore where a partial n-gram has already * been scored. * NOTE: THE RETURNED .rest AND .prob ARE RELATIVE TO THE .rest RETURNED BEFORE. */ FullScoreReturn ExtendLeft( // Additional context in reverse order. This will update add_rend to const WordIndex *add_rbegin, const WordIndex *add_rend, // Backoff weights to use. const float *backoff_in, // extend_left returned by a previous query. uint64_t extend_pointer, // Length of n-gram that the pointer corresponds to. unsigned char extend_length, // Where to write additional backoffs for [extend_length + 1, min(Order() - 1, return.ngram_length)] float *backoff_out, // Amount of additional content that should be considered by the next call. unsigned char &next_use) const; /* Return probabilities minus rest costs for an array of pointers. The * first length should be the length of the n-gram to which pointers_begin * points. */ float UnRest(const uint64_t *pointers_begin, const uint64_t *pointers_end, unsigned char first_length) const { // Compiler should optimize this if away. return Search::kDifferentRest ? InternalUnRest(pointers_begin, pointers_end, first_length) : 0.0; } private: friend void lm::ngram::LoadLM<>(const char *file, const Config &config, GenericModel &to); static void UpdateConfigFromBinary(int fd, const std::vector &counts, Config &config); FullScoreReturn ScoreExceptBackoff(const WordIndex *const context_rbegin, const WordIndex *const context_rend, const WordIndex new_word, State &out_state) const; // Score bigrams and above. Do not include backoff. 
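// Illustrative sketch (not part of the KenLM sources): the two calling styles
// documented above.  FullScore threads a State through the query, while
// FullScoreForgotState and GetState take the context as an array of vocabulary
// ids in *reverse* order (most recent word first).  Function names are
// hypothetical; the words occur in the test data used by model_test.cc.

#include "lm/model.hh"

// p(looking on a little | <s>) accumulated by threading states left to right.
inline float ScoreWithState(const lm::ngram::Model &model) {
  lm::ngram::State state(model.BeginSentenceState()), out;
  float total = 0.0;
  const char *words[] = {"looking", "on", "a", "little"};
  for (unsigned i = 0; i < sizeof(words) / sizeof(*words); ++i) {
    // in_state and out_state must be different objects.
    total += model.FullScore(state, model.GetVocabulary().Index(words[i]), out).prob;
    state = out;
  }
  return total;
}

// p(little | on a) without keeping a State around: the context array is
// right-to-left, i.e. {a, on}.
inline float ScoreForgettingState(const lm::ngram::Model &model) {
  lm::WordIndex context[2];
  context[0] = model.GetVocabulary().Index("a");
  context[1] = model.GetVocabulary().Index("on");
  lm::ngram::State out;
  return model.FullScoreForgotState(context, context + 2,
                                    model.GetVocabulary().Index("little"), out).prob;
}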
void ResumeScore(const WordIndex *context_rbegin, const WordIndex *const context_rend, unsigned char starting_order_minus_2, typename Search::Node &node, float *backoff_out, unsigned char &next_use, FullScoreReturn &ret) const; // Appears after Size in the cc file. void SetupMemory(void *start, const std::vector &counts, const Config &config); void InitializeFromBinary(void *start, const Parameters ¶ms, const Config &config, int fd); void InitializeFromARPA(const char *file, const Config &config); float InternalUnRest(const uint64_t *pointers_begin, const uint64_t *pointers_end, unsigned char first_length) const; Backing &MutableBacking() { return backing_; } Backing backing_; VocabularyT vocab_; Search search_; }; } // namespace detail // Instead of typedef, inherit. This allows the Model etc to be forward declared. // Oh the joys of C and C++. #define LM_COMMA() , #define LM_NAME_MODEL(name, from)\ class name : public from {\ public:\ name(const char *file, const Config &config = Config()) : from(file, config) {}\ }; LM_NAME_MODEL(ProbingModel, detail::GenericModel LM_COMMA() ProbingVocabulary>); LM_NAME_MODEL(RestProbingModel, detail::GenericModel LM_COMMA() ProbingVocabulary>); LM_NAME_MODEL(TrieModel, detail::GenericModel LM_COMMA() SortedVocabulary>); LM_NAME_MODEL(ArrayTrieModel, detail::GenericModel LM_COMMA() SortedVocabulary>); LM_NAME_MODEL(QuantTrieModel, detail::GenericModel LM_COMMA() SortedVocabulary>); LM_NAME_MODEL(QuantArrayTrieModel, detail::GenericModel LM_COMMA() SortedVocabulary>); // Default implementation. No real reason for it to be the default. typedef ::lm::ngram::ProbingVocabulary Vocabulary; typedef ProbingModel Model; } // namespace ngram } // namespace lm #endif // LM_MODEL__ ================================================ FILE: src/kenlm/lm/model_test.cc ================================================ #include "lm/model.hh" #include #include #define BOOST_TEST_MODULE ModelTest #include #include // Apparently some Boost versions use templates and are pretty strict about types matching. #define SLOPPY_CHECK_CLOSE(ref, value, tol) BOOST_CHECK_CLOSE(static_cast(ref), static_cast(value), static_cast(tol)); namespace lm { namespace ngram { std::ostream &operator<<(std::ostream &o, const State &state) { o << "State length " << static_cast(state.length) << ':'; for (const WordIndex *i = state.words; i < state.words + state.length; ++i) { o << ' ' << *i; } return o; } namespace { // Stupid bjam reverses the command line arguments randomly. const char *TestLocation() { if (boost::unit_test::framework::master_test_suite().argc < 3) { return "test.arpa"; } char **argv = boost::unit_test::framework::master_test_suite().argv; return argv[strstr(argv[1], "nounk") ? 2 : 1]; } const char *TestNoUnkLocation() { if (boost::unit_test::framework::master_test_suite().argc < 3) { return "test_nounk.arpa"; } char **argv = boost::unit_test::framework::master_test_suite().argv; return argv[strstr(argv[1], "nounk") ? 
1 : 2]; } template State GetState(const Model &model, const char *word, const State &in) { WordIndex context[in.length + 1]; context[0] = model.GetVocabulary().Index(word); std::copy(in.words, in.words + in.length, context + 1); State ret; model.GetState(context, context + in.length + 1, ret); return ret; } #define StartTest(word, ngram, score, indep_left) \ ret = model.FullScore( \ state, \ model.GetVocabulary().Index(word), \ out);\ SLOPPY_CHECK_CLOSE(score, ret.prob, 0.001); \ BOOST_CHECK_EQUAL(static_cast(ngram), ret.ngram_length); \ BOOST_CHECK_GE(std::min(ngram, 5 - 1), out.length); \ BOOST_CHECK_EQUAL(indep_left, ret.independent_left); \ BOOST_CHECK_EQUAL(out, GetState(model, word, state)); #define AppendTest(word, ngram, score, indep_left) \ StartTest(word, ngram, score, indep_left) \ state = out; template void Starters(const M &model) { FullScoreReturn ret; Model::State state(model.BeginSentenceState()); Model::State out; StartTest("looking", 2, -0.4846522, true); // , probability plus backoff StartTest(",", 1, -1.383514 + -0.4149733, true); // probability plus backoff StartTest("this_is_not_found", 1, -1.995635 + -0.4149733, true); } template void Continuation(const M &model) { FullScoreReturn ret; Model::State state(model.BeginSentenceState()); Model::State out; AppendTest("looking", 2, -0.484652, true); AppendTest("on", 3, -0.348837, true); AppendTest("a", 4, -0.0155266, true); AppendTest("little", 5, -0.00306122, true); State preserve = state; AppendTest("the", 1, -4.04005, true); AppendTest("biarritz", 1, -1.9889, true); AppendTest("not_found", 1, -2.29666, true); AppendTest("more", 1, -1.20632 - 20.0, true); AppendTest(".", 2, -0.51363, true); AppendTest("", 3, -0.0191651, true); BOOST_CHECK_EQUAL(0, state.length); state = preserve; AppendTest("more", 5, -0.00181395, true); BOOST_CHECK_EQUAL(4, state.length); AppendTest("loin", 5, -0.0432557, true); BOOST_CHECK_EQUAL(1, state.length); } template void Blanks(const M &model) { FullScoreReturn ret; State state(model.NullContextState()); State out; AppendTest("also", 1, -1.687872, false); AppendTest("would", 2, -2, true); AppendTest("consider", 3, -3, true); State preserve = state; AppendTest("higher", 4, -4, true); AppendTest("looking", 5, -5, true); BOOST_CHECK_EQUAL(1, state.length); state = preserve; // also would consider not_found AppendTest("not_found", 1, -1.995635 - 7.0 - 0.30103, true); state = model.NullContextState(); // higher looking is a blank. 
AppendTest("higher", 1, -1.509559, false); AppendTest("looking", 2, -1.285941 - 0.30103, false); State higher_looking = state; BOOST_CHECK_EQUAL(1, state.length); AppendTest("not_found", 1, -1.995635 - 0.4771212, true); state = higher_looking; // higher looking consider AppendTest("consider", 1, -1.687872 - 0.4771212, true); state = model.NullContextState(); AppendTest("would", 1, -1.687872, false); BOOST_CHECK_EQUAL(1, state.length); AppendTest("consider", 2, -1.687872 -0.30103, false); BOOST_CHECK_EQUAL(2, state.length); AppendTest("higher", 3, -1.509559 - 0.30103, false); BOOST_CHECK_EQUAL(3, state.length); AppendTest("looking", 4, -1.285941 - 0.30103, false); } template void Unknowns(const M &model) { FullScoreReturn ret; State state(model.NullContextState()); State out; AppendTest("not_found", 1, -1.995635, false); State preserve = state; AppendTest("not_found2", 2, -15.0, true); AppendTest("not_found3", 2, -15.0 - 2.0, true); state = preserve; AppendTest("however", 2, -4, true); AppendTest("not_found3", 3, -6, true); } template void MinimalState(const M &model) { FullScoreReturn ret; State state(model.NullContextState()); State out; AppendTest("baz", 1, -6.535897, true); BOOST_CHECK_EQUAL(0, state.length); state = model.NullContextState(); AppendTest("foo", 1, -3.141592, true); BOOST_CHECK_EQUAL(1, state.length); AppendTest("bar", 2, -6.0, true); // Has to include the backoff weight. BOOST_CHECK_EQUAL(1, state.length); AppendTest("bar", 1, -2.718281 + 3.0, true); BOOST_CHECK_EQUAL(1, state.length); state = model.NullContextState(); AppendTest("to", 1, -1.687872, false); AppendTest("look", 2, -0.2922095, true); BOOST_CHECK_EQUAL(2, state.length); AppendTest("good", 3, -7, true); } template void ExtendLeftTest(const M &model) { State right; FullScoreReturn little(model.FullScore(model.NullContextState(), model.GetVocabulary().Index("little"), right)); const float kLittleProb = -1.285941; SLOPPY_CHECK_CLOSE(kLittleProb, little.prob, 0.001); unsigned char next_use; float backoff_out[4]; FullScoreReturn extend_none(model.ExtendLeft(NULL, NULL, NULL, little.extend_left, 1, NULL, next_use)); BOOST_CHECK_EQUAL(0, next_use); BOOST_CHECK_EQUAL(little.extend_left, extend_none.extend_left); SLOPPY_CHECK_CLOSE(little.prob - little.rest, extend_none.prob, 0.001); BOOST_CHECK_EQUAL(1, extend_none.ngram_length); const WordIndex a = model.GetVocabulary().Index("a"); float backoff_in = 3.14; // a little FullScoreReturn extend_a(model.ExtendLeft(&a, &a + 1, &backoff_in, little.extend_left, 1, backoff_out, next_use)); BOOST_CHECK_EQUAL(1, next_use); SLOPPY_CHECK_CLOSE(-0.69897, backoff_out[0], 0.001); SLOPPY_CHECK_CLOSE(-0.09132547 - little.rest, extend_a.prob, 0.001); BOOST_CHECK_EQUAL(2, extend_a.ngram_length); BOOST_CHECK(!extend_a.independent_left); const WordIndex on = model.GetVocabulary().Index("on"); FullScoreReturn extend_on(model.ExtendLeft(&on, &on + 1, &backoff_in, extend_a.extend_left, 2, backoff_out, next_use)); BOOST_CHECK_EQUAL(1, next_use); SLOPPY_CHECK_CLOSE(-0.4771212, backoff_out[0], 0.001); SLOPPY_CHECK_CLOSE(-0.0283603 - (extend_a.rest + little.rest), extend_on.prob, 0.001); BOOST_CHECK_EQUAL(3, extend_on.ngram_length); BOOST_CHECK(!extend_on.independent_left); const WordIndex both[2] = {a, on}; float backoff_in_arr[4]; FullScoreReturn extend_both(model.ExtendLeft(both, both + 2, backoff_in_arr, little.extend_left, 1, backoff_out, next_use)); BOOST_CHECK_EQUAL(2, next_use); SLOPPY_CHECK_CLOSE(-0.69897, backoff_out[0], 0.001); SLOPPY_CHECK_CLOSE(-0.4771212, backoff_out[1], 0.001); 
SLOPPY_CHECK_CLOSE(-0.0283603 - little.rest, extend_both.prob, 0.001); BOOST_CHECK_EQUAL(3, extend_both.ngram_length); BOOST_CHECK(!extend_both.independent_left); BOOST_CHECK_EQUAL(extend_on.extend_left, extend_both.extend_left); } #define StatelessTest(word, provide, ngram, score) \ ret = model.FullScoreForgotState(indices + num_words - word, indices + num_words - word + provide, indices[num_words - word - 1], state); \ SLOPPY_CHECK_CLOSE(score, ret.prob, 0.001); \ BOOST_CHECK_EQUAL(static_cast(ngram), ret.ngram_length); \ model.GetState(indices + num_words - word, indices + num_words - word + provide, before); \ ret = model.FullScore(before, indices[num_words - word - 1], out); \ BOOST_CHECK(state == out); \ SLOPPY_CHECK_CLOSE(score, ret.prob, 0.001); \ BOOST_CHECK_EQUAL(static_cast(ngram), ret.ngram_length); template void Stateless(const M &model) { const char *words[] = {"", "looking", "on", "a", "little", "the", "biarritz", "not_found", "more", ".", ""}; const size_t num_words = sizeof(words) / sizeof(const char*); // Silience "array subscript is above array bounds" when extracting end pointer. WordIndex indices[num_words + 1]; for (unsigned int i = 0; i < num_words; ++i) { indices[num_words - 1 - i] = model.GetVocabulary().Index(words[i]); } FullScoreReturn ret; State state, out, before; ret = model.FullScoreForgotState(indices + num_words - 1, indices + num_words, indices[num_words - 2], state); SLOPPY_CHECK_CLOSE(-0.484652, ret.prob, 0.001); StatelessTest(1, 1, 2, -0.484652); // looking StatelessTest(1, 2, 2, -0.484652); // on AppendTest("on", 3, -0.348837, true); StatelessTest(2, 3, 3, -0.348837); StatelessTest(2, 2, 3, -0.348837); StatelessTest(2, 1, 2, -0.4638903); // a StatelessTest(3, 4, 4, -0.0155266); // little AppendTest("little", 5, -0.00306122, true); StatelessTest(4, 5, 5, -0.00306122); // the AppendTest("the", 1, -4.04005, true); StatelessTest(5, 5, 1, -4.04005); // No context of the. 
StatelessTest(5, 0, 1, -1.687872); // biarritz StatelessTest(6, 1, 1, -1.9889); // not found StatelessTest(7, 1, 1, -2.29666); StatelessTest(7, 0, 1, -1.995635); WordIndex unk[1]; unk[0] = 0; model.GetState(unk, unk + 1, state); BOOST_CHECK_EQUAL(1, state.length); BOOST_CHECK_EQUAL(static_cast(0), state.words[0]); } template void NoUnkCheck(const M &model) { WordIndex unk_index = 0; State state; FullScoreReturn ret = model.FullScoreForgotState(&unk_index, &unk_index + 1, unk_index, state); SLOPPY_CHECK_CLOSE(-100.0, ret.prob, 0.001); } template void Everything(const M &m) { Starters(m); Continuation(m); Blanks(m); Unknowns(m); MinimalState(m); ExtendLeftTest(m); Stateless(m); } class ExpectEnumerateVocab : public EnumerateVocab { public: ExpectEnumerateVocab() {} void Add(WordIndex index, const StringPiece &str) { BOOST_CHECK_EQUAL(seen.size(), index); seen.push_back(std::string(str.data(), str.length())); } void Check(const base::Vocabulary &vocab) { BOOST_CHECK_EQUAL(37ULL, seen.size()); BOOST_REQUIRE(!seen.empty()); BOOST_CHECK_EQUAL("", seen[0]); for (WordIndex i = 0; i < seen.size(); ++i) { BOOST_CHECK_EQUAL(i, vocab.Index(seen[i])); } } void Clear() { seen.clear(); } std::vector seen; }; template void LoadingTest() { Config config; config.arpa_complain = Config::NONE; config.messages = NULL; config.probing_multiplier = 2.0; { ExpectEnumerateVocab enumerate; config.enumerate_vocab = &enumerate; ModelT m(TestLocation(), config); enumerate.Check(m.GetVocabulary()); BOOST_CHECK_EQUAL((WordIndex)37, m.GetVocabulary().Bound()); Everything(m); } { ExpectEnumerateVocab enumerate; config.enumerate_vocab = &enumerate; ModelT m(TestNoUnkLocation(), config); enumerate.Check(m.GetVocabulary()); BOOST_CHECK_EQUAL((WordIndex)37, m.GetVocabulary().Bound()); NoUnkCheck(m); } } BOOST_AUTO_TEST_CASE(probing) { LoadingTest(); } BOOST_AUTO_TEST_CASE(trie) { LoadingTest(); } BOOST_AUTO_TEST_CASE(quant_trie) { LoadingTest(); } BOOST_AUTO_TEST_CASE(bhiksha_trie) { LoadingTest(); } BOOST_AUTO_TEST_CASE(quant_bhiksha_trie) { LoadingTest(); } template void BinaryTest() { Config config; config.write_mmap = "test.binary"; config.messages = NULL; ExpectEnumerateVocab enumerate; config.enumerate_vocab = &enumerate; { ModelT copy_model(TestLocation(), config); enumerate.Check(copy_model.GetVocabulary()); enumerate.Clear(); Everything(copy_model); } config.write_mmap = NULL; ModelType type; BOOST_REQUIRE(RecognizeBinary("test.binary", type)); BOOST_CHECK_EQUAL(ModelT::kModelType, type); { ModelT binary("test.binary", config); enumerate.Check(binary.GetVocabulary()); Everything(binary); } unlink("test.binary"); // Now test without . 
config.write_mmap = "test_nounk.binary"; config.messages = NULL; enumerate.Clear(); { ModelT copy_model(TestNoUnkLocation(), config); enumerate.Check(copy_model.GetVocabulary()); enumerate.Clear(); NoUnkCheck(copy_model); } config.write_mmap = NULL; { ModelT binary(TestNoUnkLocation(), config); enumerate.Check(binary.GetVocabulary()); NoUnkCheck(binary); } unlink("test_nounk.binary"); } BOOST_AUTO_TEST_CASE(write_and_read_probing) { BinaryTest(); } BOOST_AUTO_TEST_CASE(write_and_read_rest_probing) { BinaryTest(); } BOOST_AUTO_TEST_CASE(write_and_read_trie) { BinaryTest(); } BOOST_AUTO_TEST_CASE(write_and_read_quant_trie) { BinaryTest(); } BOOST_AUTO_TEST_CASE(write_and_read_array_trie) { BinaryTest(); } BOOST_AUTO_TEST_CASE(write_and_read_quant_array_trie) { BinaryTest(); } BOOST_AUTO_TEST_CASE(rest_max) { Config config; config.arpa_complain = Config::NONE; config.messages = NULL; RestProbingModel model(TestLocation(), config); State state, out; FullScoreReturn ret(model.FullScore(model.NullContextState(), model.GetVocabulary().Index("."), state)); SLOPPY_CHECK_CLOSE(-0.2705918, ret.rest, 0.001); SLOPPY_CHECK_CLOSE(-0.01916512, model.FullScore(state, model.GetVocabulary().EndSentence(), out).rest, 0.001); } } // namespace } // namespace ngram } // namespace lm ================================================ FILE: src/kenlm/lm/model_type.hh ================================================ #ifndef LM_MODEL_TYPE__ #define LM_MODEL_TYPE__ namespace lm { namespace ngram { /* Not the best numbering system, but it grew this way for historical reasons * and I want to preserve existing binary files. */ typedef enum {PROBING=0, REST_PROBING=1, TRIE=2, QUANT_TRIE=3, ARRAY_TRIE=4, QUANT_ARRAY_TRIE=5} ModelType; // Historical names. const ModelType HASH_PROBING = PROBING; const ModelType TRIE_SORTED = TRIE; const ModelType QUANT_TRIE_SORTED = QUANT_TRIE; const ModelType ARRAY_TRIE_SORTED = ARRAY_TRIE; const ModelType QUANT_ARRAY_TRIE_SORTED = QUANT_ARRAY_TRIE; const static ModelType kQuantAdd = static_cast(QUANT_TRIE - TRIE); const static ModelType kArrayAdd = static_cast(ARRAY_TRIE - TRIE); } // namespace ngram } // namespace lm #endif // LM_MODEL_TYPE__ ================================================ FILE: src/kenlm/lm/ngram_query.hh ================================================ #ifndef LM_NGRAM_QUERY__ #define LM_NGRAM_QUERY__ #include "lm/enumerate_vocab.hh" #include "lm/model.hh" #include "util/usage.hh" #include #include #include #include #include namespace lm { namespace ngram { template void Query(const Model &model, bool sentence_context, std::istream &in_stream, std::ostream &out_stream) { std::cerr << "Loading statistics:\n"; util::PrintUsage(std::cerr); typename Model::State state, out; lm::FullScoreReturn ret; std::string word; while (in_stream) { state = sentence_context ? 
model.BeginSentenceState() : model.NullContextState(); float total = 0.0; bool got = false; unsigned int oov = 0; while (in_stream >> word) { got = true; lm::WordIndex vocab = model.GetVocabulary().Index(word); if (vocab == 0) ++oov; ret = model.FullScore(state, vocab, out); total += ret.prob; out_stream << word << '=' << vocab << ' ' << static_cast(ret.ngram_length) << ' ' << ret.prob << '\t'; state = out; char c; while (true) { c = in_stream.get(); if (!in_stream) break; if (c == '\n') break; if (!isspace(c)) { in_stream.unget(); break; } } if (c == '\n') break; } if (!got && !in_stream) break; if (sentence_context) { ret = model.FullScore(state, model.GetVocabulary().EndSentence(), out); total += ret.prob; out_stream << "=" << model.GetVocabulary().EndSentence() << ' ' << static_cast(ret.ngram_length) << ' ' << ret.prob << '\t'; } out_stream << "Total: " << total << " OOV: " << oov << '\n'; } std::cerr << "After queries:\n"; util::PrintUsage(std::cerr); } template void Query(const char *file, bool sentence_context, std::istream &in_stream, std::ostream &out_stream) { Config config; M model(file, config); Query(model, sentence_context, in_stream, out_stream); } } // namespace ngram } // namespace lm #endif // LM_NGRAM_QUERY__ ================================================ FILE: src/kenlm/lm/partial.hh ================================================ #ifndef LM_PARTIAL__ #define LM_PARTIAL__ #include "lm/return.hh" #include "lm/state.hh" #include #include namespace lm { namespace ngram { struct ExtendReturn { float adjust; bool make_full; unsigned char next_use; }; template ExtendReturn ExtendLoop( const Model &model, unsigned char seen, const WordIndex *add_rbegin, const WordIndex *add_rend, const float *backoff_start, const uint64_t *pointers, const uint64_t *pointers_end, uint64_t *&pointers_write, float *backoff_write) { unsigned char add_length = add_rend - add_rbegin; float backoff_buf[2][KENLM_MAX_ORDER - 1]; float *backoff_in = backoff_buf[0], *backoff_out = backoff_buf[1]; std::copy(backoff_start, backoff_start + add_length, backoff_in); ExtendReturn value; value.make_full = false; value.adjust = 0.0; value.next_use = add_length; unsigned char i = 0; unsigned char length = pointers_end - pointers; // pointers_write is NULL means that the existing left state is full, so we should use completed probabilities. if (pointers_write) { // Using full context, writing to new left state. for (; i < length; ++i) { FullScoreReturn ret(model.ExtendLeft( add_rbegin, add_rbegin + value.next_use, backoff_in, pointers[i], i + seen + 1, backoff_out, value.next_use)); std::swap(backoff_in, backoff_out); if (ret.independent_left) { value.adjust += ret.prob; value.make_full = true; ++i; break; } value.adjust += ret.rest; *pointers_write++ = ret.extend_left; if (value.next_use != add_length) { value.make_full = true; ++i; break; } } } // Using some of the new context. for (; i < length && value.next_use; ++i) { FullScoreReturn ret(model.ExtendLeft( add_rbegin, add_rbegin + value.next_use, backoff_in, pointers[i], i + seen + 1, backoff_out, value.next_use)); std::swap(backoff_in, backoff_out); value.adjust += ret.prob; } float unrest = model.UnRest(pointers + i, pointers_end, i + seen + 1); // Using none of the new context. 
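// Illustrative sketch (not part of the KenLM sources): a minimal driver for
// the Query template defined in ngram_query.hh above.  It scores whitespace-
// tokenized sentences from stdin with sentence context and prints the
// per-word breakdown plus totals.  The probing model type is assumed here for
// brevity; a real tool would dispatch on RecognizeBinary.

#include "lm/ngram_query.hh"

#include <iostream>

int main(int argc, char *argv[]) {
  if (argc != 2) {
    std::cerr << "Usage: " << argv[0] << " model_file" << std::endl;
    return 1;
  }
  lm::ngram::Query<lm::ngram::ProbingModel>(argv[1], true /* sentence_context */,
                                            std::cin, std::cout);
  return 0;
}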
value.adjust += unrest; std::copy(backoff_in, backoff_in + value.next_use, backoff_write); return value; } template float RevealBefore(const Model &model, const Right &reveal, const unsigned char seen, bool reveal_full, Left &left, Right &right) { assert(seen < reveal.length || reveal_full); uint64_t *pointers_write = reveal_full ? NULL : left.pointers; float backoff_buffer[KENLM_MAX_ORDER - 1]; ExtendReturn value(ExtendLoop( model, seen, reveal.words + seen, reveal.words + reveal.length, reveal.backoff + seen, left.pointers, left.pointers + left.length, pointers_write, left.full ? backoff_buffer : (right.backoff + right.length))); if (reveal_full) { left.length = 0; value.make_full = true; } else { left.length = pointers_write - left.pointers; value.make_full |= (left.length == model.Order() - 1); } if (left.full) { for (unsigned char i = 0; i < value.next_use; ++i) value.adjust += backoff_buffer[i]; } else { // If left wasn't full when it came in, put words into right state. std::copy(reveal.words + seen, reveal.words + seen + value.next_use, right.words + right.length); right.length += value.next_use; left.full = value.make_full || (right.length == model.Order() - 1); } return value.adjust; } template float RevealAfter(const Model &model, Left &left, Right &right, const Left &reveal, unsigned char seen) { assert(seen < reveal.length || reveal.full); uint64_t *pointers_write = left.full ? NULL : (left.pointers + left.length); ExtendReturn value(ExtendLoop( model, seen, right.words, right.words + right.length, right.backoff, reveal.pointers + seen, reveal.pointers + reveal.length, pointers_write, right.backoff)); if (reveal.full) { for (unsigned char i = 0; i < value.next_use; ++i) value.adjust += right.backoff[i]; right.length = 0; value.make_full = true; } else { right.length = value.next_use; value.make_full |= (right.length == model.Order() - 1); } if (!left.full) { left.length = pointers_write - left.pointers; left.full = value.make_full || (left.length == model.Order() - 1); } return value.adjust; } template float Subsume(const Model &model, Left &first_left, const Right &first_right, const Left &second_left, Right &second_right, const unsigned int between_length) { assert(first_right.length < KENLM_MAX_ORDER); assert(second_left.length < KENLM_MAX_ORDER); assert(between_length < KENLM_MAX_ORDER - 1); uint64_t *pointers_write = first_left.full ? NULL : (first_left.pointers + first_left.length); float backoff_buffer[KENLM_MAX_ORDER - 1]; ExtendReturn value(ExtendLoop( model, between_length, first_right.words, first_right.words + first_right.length, first_right.backoff, second_left.pointers, second_left.pointers + second_left.length, pointers_write, second_left.full ? 
backoff_buffer : (second_right.backoff + second_right.length))); if (second_left.full) { for (unsigned char i = 0; i < value.next_use; ++i) value.adjust += backoff_buffer[i]; } else { std::copy(first_right.words, first_right.words + value.next_use, second_right.words + second_right.length); second_right.length += value.next_use; value.make_full |= (second_right.length == model.Order() - 1); } if (!first_left.full) { first_left.length = pointers_write - first_left.pointers; first_left.full = value.make_full || second_left.full || (first_left.length == model.Order() - 1); } assert(first_left.length < KENLM_MAX_ORDER); assert(second_right.length < KENLM_MAX_ORDER); return value.adjust; } } // namespace ngram } // namespace lm #endif // LM_PARTIAL__ ================================================ FILE: src/kenlm/lm/partial_test.cc ================================================ #include "lm/partial.hh" #include "lm/left.hh" #include "lm/model.hh" #include "util/tokenize_piece.hh" #define BOOST_TEST_MODULE PartialTest #include #include namespace lm { namespace ngram { namespace { const char *TestLocation() { if (boost::unit_test::framework::master_test_suite().argc < 2) { return "test.arpa"; } return boost::unit_test::framework::master_test_suite().argv[1]; } Config SilentConfig() { Config config; config.arpa_complain = Config::NONE; config.messages = NULL; return config; } struct ModelFixture { ModelFixture() : m(TestLocation(), SilentConfig()) {} RestProbingModel m; }; BOOST_FIXTURE_TEST_SUITE(suite, ModelFixture) BOOST_AUTO_TEST_CASE(SimpleBefore) { Left left; left.full = false; left.length = 0; Right right; right.length = 0; Right reveal; reveal.length = 1; WordIndex period = m.GetVocabulary().Index("."); reveal.words[0] = period; reveal.backoff[0] = -0.845098; BOOST_CHECK_CLOSE(0.0, RevealBefore(m, reveal, 0, false, left, right), 0.001); BOOST_CHECK_EQUAL(0, left.length); BOOST_CHECK(!left.full); BOOST_CHECK_EQUAL(1, right.length); BOOST_CHECK_EQUAL(period, right.words[0]); BOOST_CHECK_CLOSE(-0.845098, right.backoff[0], 0.001); WordIndex more = m.GetVocabulary().Index("more"); reveal.words[1] = more; reveal.backoff[1] = -0.4771212; reveal.length = 2; BOOST_CHECK_CLOSE(0.0, RevealBefore(m, reveal, 1, false, left, right), 0.001); BOOST_CHECK_EQUAL(0, left.length); BOOST_CHECK(!left.full); BOOST_CHECK_EQUAL(2, right.length); BOOST_CHECK_EQUAL(period, right.words[0]); BOOST_CHECK_EQUAL(more, right.words[1]); BOOST_CHECK_CLOSE(-0.845098, right.backoff[0], 0.001); BOOST_CHECK_CLOSE(-0.4771212, right.backoff[1], 0.001); } BOOST_AUTO_TEST_CASE(AlsoWouldConsider) { WordIndex would = m.GetVocabulary().Index("would"); WordIndex consider = m.GetVocabulary().Index("consider"); ChartState current; current.left.length = 1; current.left.pointers[0] = would; current.left.full = false; current.right.length = 1; current.right.words[0] = would; current.right.backoff[0] = -0.30103; Left after; after.full = false; after.length = 1; after.pointers[0] = consider; // adjustment for would consider BOOST_CHECK_CLOSE(-1.687872 - -0.2922095 - 0.30103, RevealAfter(m, current.left, current.right, after, 0), 0.001); BOOST_CHECK_EQUAL(2, current.left.length); BOOST_CHECK_EQUAL(would, current.left.pointers[0]); BOOST_CHECK_EQUAL(false, current.left.full); WordIndex also = m.GetVocabulary().Index("also"); Right before; before.length = 1; before.words[0] = also; before.backoff[0] = -0.30103; // r(would) = -0.2922095 [i would], r(would -> consider) = -1.988902 [b(would) + p(consider)] // p(also -> would) = -2, p(also would 
-> consider) = -3 BOOST_CHECK_CLOSE(-2 + 0.2922095 -3 + 1.988902, RevealBefore(m, before, 0, false, current.left, current.right), 0.001); BOOST_CHECK_EQUAL(0, current.left.length); BOOST_CHECK(current.left.full); BOOST_CHECK_EQUAL(2, current.right.length); BOOST_CHECK_EQUAL(would, current.right.words[0]); BOOST_CHECK_EQUAL(also, current.right.words[1]); } BOOST_AUTO_TEST_CASE(EndSentence) { WordIndex loin = m.GetVocabulary().Index("loin"); WordIndex period = m.GetVocabulary().Index("."); WordIndex eos = m.GetVocabulary().EndSentence(); ChartState between; between.left.length = 1; between.left.pointers[0] = eos; between.left.full = true; between.right.length = 0; Right before; before.words[0] = period; before.words[1] = loin; before.backoff[0] = -0.845098; before.backoff[1] = 0.0; before.length = 1; BOOST_CHECK_CLOSE(-0.0410707, RevealBefore(m, before, 0, true, between.left, between.right), 0.001); BOOST_CHECK_EQUAL(0, between.left.length); } float ScoreFragment(const RestProbingModel &model, unsigned int *begin, unsigned int *end, ChartState &out) { RuleScore scorer(model, out); for (unsigned int *i = begin; i < end; ++i) { scorer.Terminal(*i); } return scorer.Finish(); } void CheckAdjustment(const RestProbingModel &model, float expect, const Right &before_in, bool before_full, ChartState between, const Left &after_in) { Right before(before_in); Left after(after_in); after.full = false; float got = 0.0; for (unsigned int i = 1; i < 5; ++i) { if (before_in.length >= i) { before.length = i; got += RevealBefore(model, before, i - 1, false, between.left, between.right); } if (after_in.length >= i) { after.length = i; got += RevealAfter(model, between.left, between.right, after, i - 1); } } if (after_in.full) { after.full = true; got += RevealAfter(model, between.left, between.right, after, after.length); } if (before_full) { got += RevealBefore(model, before, before.length, true, between.left, between.right); } // Sometimes they're zero and BOOST_CHECK_CLOSE fails for this. BOOST_CHECK(fabs(expect - got) < 0.001); } void FullDivide(const RestProbingModel &model, StringPiece str) { std::vector indices; for (util::TokenIter i(str, ' '); i; ++i) { indices.push_back(model.GetVocabulary().Index(*i)); } ChartState full_state; float full = ScoreFragment(model, &indices.front(), &indices.back() + 1, full_state); ChartState before_state; before_state.left.full = false; RuleScore before_scorer(model, before_state); float before_score = 0.0; for (unsigned int before = 0; before < indices.size(); ++before) { for (unsigned int after = before; after <= indices.size(); ++after) { ChartState after_state, between_state; float after_score = ScoreFragment(model, &indices.front() + after, &indices.front() + indices.size(), after_state); float between_score = ScoreFragment(model, &indices.front() + before, &indices.front() + after, between_state); CheckAdjustment(model, full - before_score - after_score - between_score, before_state.right, before_state.left.full, between_state, after_state.left); } before_scorer.Terminal(indices[before]); before_score = before_scorer.Finish(); } } BOOST_AUTO_TEST_CASE(Strings) { FullDivide(m, "also would consider"); FullDivide(m, "looking on a little more loin . "); FullDivide(m, "in biarritz watching considering looking . 
on a little more loin also would consider higher to look good unknown the screening foo bar , unknown however unknown "); } BOOST_AUTO_TEST_SUITE_END() } // namespace } // namespace ngram } // namespace lm ================================================ FILE: src/kenlm/lm/quantize.cc ================================================ /* Quantize into bins of equal size as described in * M. Federico and N. Bertoldi. 2006. How many bits are needed * to store probabilities for phrase-based translation? In Proc. * of the Workshop on Statistical Machine Translation, pages * 94–101, New York City, June. Association for Computa- * tional Linguistics. */ #include "lm/quantize.hh" #include "lm/binary_format.hh" #include "lm/lm_exception.hh" #include "util/file.hh" #include #include namespace lm { namespace ngram { namespace { void MakeBins(std::vector &values, float *centers, uint32_t bins) { std::sort(values.begin(), values.end()); std::vector::const_iterator start = values.begin(), finish; for (uint32_t i = 0; i < bins; ++i, ++centers, start = finish) { finish = values.begin() + ((values.size() * static_cast(i + 1)) / bins); if (finish == start) { // zero length bucket. *centers = i ? *(centers - 1) : -std::numeric_limits::infinity(); } else { *centers = std::accumulate(start, finish, 0.0) / static_cast(finish - start); } } } const char kSeparatelyQuantizeVersion = 2; } // namespace void SeparatelyQuantize::UpdateConfigFromBinary(int fd, const std::vector &/*counts*/, Config &config) { char version; util::ReadOrThrow(fd, &version, 1); util::ReadOrThrow(fd, &config.prob_bits, 1); util::ReadOrThrow(fd, &config.backoff_bits, 1); if (version != kSeparatelyQuantizeVersion) UTIL_THROW(FormatLoadException, "This file has quantization version " << (unsigned)version << " but the code expects version " << (unsigned)kSeparatelyQuantizeVersion); util::AdvanceOrThrow(fd, -3); } void SeparatelyQuantize::SetupMemory(void *base, unsigned char order, const Config &config) { prob_bits_ = config.prob_bits; backoff_bits_ = config.backoff_bits; // We need the reserved values. if (config.prob_bits == 0) UTIL_THROW(ConfigException, "You can't quantize probability to zero"); if (config.backoff_bits == 0) UTIL_THROW(ConfigException, "You can't quantize backoff to zero"); if (config.prob_bits > 25) UTIL_THROW(ConfigException, "For efficiency reasons, quantizing probability supports at most 25 bits. Currently you have requested " << static_cast(config.prob_bits) << " bits."); if (config.backoff_bits > 25) UTIL_THROW(ConfigException, "For efficiency reasons, quantizing backoff supports at most 25 bits. Currently you have requested " << static_cast(config.backoff_bits) << " bits."); // Reserve 8 byte header for bit counts. 
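  // Resulting layout: 8-byte header (version byte, prob_bits, backoff_bits, padding),
  // then for each middle order a table of 2^prob_bits probability centers followed by
  // 2^backoff_bits backoff centers, and finally 2^prob_bits centers for the longest
  // order, which stores no backoff.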
actual_base_ = static_cast(base); float *start = reinterpret_cast(actual_base_ + 8); for (unsigned char i = 0; i < order - 2; ++i) { tables_[i][0] = Bins(prob_bits_, start); start += (1ULL << prob_bits_); tables_[i][1] = Bins(backoff_bits_, start); start += (1ULL << backoff_bits_); } longest_ = tables_[order - 2][0] = Bins(prob_bits_, start); } void SeparatelyQuantize::Train(uint8_t order, std::vector &prob, std::vector &backoff) { TrainProb(order, prob); // Backoff float *centers = tables_[order - 2][1].Populate(); *(centers++) = kNoExtensionBackoff; *(centers++) = kExtensionBackoff; MakeBins(backoff, centers, (1ULL << backoff_bits_) - 2); } void SeparatelyQuantize::TrainProb(uint8_t order, std::vector &prob) { float *centers = tables_[order - 2][0].Populate(); MakeBins(prob, centers, (1ULL << prob_bits_)); } void SeparatelyQuantize::FinishedLoading(const Config &config) { uint8_t *actual_base = actual_base_; *(actual_base++) = kSeparatelyQuantizeVersion; // version *(actual_base++) = config.prob_bits; *(actual_base++) = config.backoff_bits; } } // namespace ngram } // namespace lm ================================================ FILE: src/kenlm/lm/quantize.hh ================================================ #ifndef LM_QUANTIZE_H__ #define LM_QUANTIZE_H__ #include "lm/blank.hh" #include "lm/config.hh" #include "lm/max_order.hh" #include "lm/model_type.hh" #include "util/bit_packing.hh" #include #include #include #include namespace lm { namespace ngram { struct Config; /* Store values directly and don't quantize. */ class DontQuantize { public: static const ModelType kModelTypeAdd = static_cast(0); static void UpdateConfigFromBinary(int, const std::vector &, Config &) {} static uint64_t Size(uint8_t /*order*/, const Config &/*config*/) { return 0; } static uint8_t MiddleBits(const Config &/*config*/) { return 63; } static uint8_t LongestBits(const Config &/*config*/) { return 31; } class MiddlePointer { public: MiddlePointer(const DontQuantize & /*quant*/, unsigned char /*order_minus_2*/, util::BitAddress address) : address_(address) {} MiddlePointer() : address_(NULL, 0) {} bool Found() const { return address_.base != NULL; } float Prob() const { return util::ReadNonPositiveFloat31(address_.base, address_.offset); } float Backoff() const { return util::ReadFloat32(address_.base, address_.offset + 31); } float Rest() const { return Prob(); } void Write(float prob, float backoff) { util::WriteNonPositiveFloat31(address_.base, address_.offset, prob); util::WriteFloat32(address_.base, address_.offset + 31, backoff); } private: util::BitAddress address_; }; class LongestPointer { public: explicit LongestPointer(const DontQuantize &/*quant*/, util::BitAddress address) : address_(address) {} LongestPointer() : address_(NULL, 0) {} bool Found() const { return address_.base != NULL; } float Prob() const { return util::ReadNonPositiveFloat31(address_.base, address_.offset); } void Write(float prob) { util::WriteNonPositiveFloat31(address_.base, address_.offset, prob); } private: util::BitAddress address_; }; DontQuantize() {} void SetupMemory(void * /*start*/, unsigned char /*order*/, const Config & /*config*/) {} static const bool kTrain = false; // These should never be called because kTrain is false. 
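    // The no-op stubs below exist so DontQuantize presents the same interface as
    // SeparatelyQuantize and the two can be swapped as a template argument.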
void Train(uint8_t /*order*/, std::vector &/*prob*/, std::vector &/*backoff*/) {} void TrainProb(uint8_t, std::vector &/*prob*/) {} void FinishedLoading(const Config &) {} }; class SeparatelyQuantize { private: class Bins { public: // Sigh C++ default constructor Bins() {} Bins(uint8_t bits, float *begin) : begin_(begin), end_(begin_ + (1ULL << bits)), bits_(bits), mask_((1ULL << bits) - 1) {} float *Populate() { return begin_; } uint64_t EncodeProb(float value) const { return Encode(value, 0); } uint64_t EncodeBackoff(float value) const { if (value == 0.0) { return HasExtension(value) ? kExtensionQuant : kNoExtensionQuant; } return Encode(value, 2); } float Decode(std::size_t off) const { return begin_[off]; } uint8_t Bits() const { return bits_; } uint64_t Mask() const { return mask_; } private: uint64_t Encode(float value, size_t reserved) const { const float *above = std::lower_bound(static_cast(begin_) + reserved, end_, value); if (above == begin_ + reserved) return reserved; if (above == end_) return end_ - begin_ - 1; return above - begin_ - (value - *(above - 1) < *above - value); } float *begin_; const float *end_; uint8_t bits_; uint64_t mask_; }; public: static const ModelType kModelTypeAdd = kQuantAdd; static void UpdateConfigFromBinary(int fd, const std::vector &counts, Config &config); static uint64_t Size(uint8_t order, const Config &config) { uint64_t longest_table = (static_cast(1) << static_cast(config.prob_bits)) * sizeof(float); uint64_t middle_table = (static_cast(1) << static_cast(config.backoff_bits)) * sizeof(float) + longest_table; // unigrams are currently not quantized so no need for a table. return (order - 2) * middle_table + longest_table + /* for the bit counts and alignment padding) */ 8; } static uint8_t MiddleBits(const Config &config) { return config.prob_bits + config.backoff_bits; } static uint8_t LongestBits(const Config &config) { return config.prob_bits; } class MiddlePointer { public: MiddlePointer(const SeparatelyQuantize &quant, unsigned char order_minus_2, const util::BitAddress &address) : bins_(quant.GetTables(order_minus_2)), address_(address) {} MiddlePointer() : address_(NULL, 0) {} bool Found() const { return address_.base != NULL; } float Prob() const { return ProbBins().Decode(util::ReadInt25(address_.base, address_.offset + BackoffBins().Bits(), ProbBins().Bits(), ProbBins().Mask())); } float Backoff() const { return BackoffBins().Decode(util::ReadInt25(address_.base, address_.offset, BackoffBins().Bits(), BackoffBins().Mask())); } float Rest() const { return Prob(); } void Write(float prob, float backoff) const { util::WriteInt57(address_.base, address_.offset, ProbBins().Bits() + BackoffBins().Bits(), (ProbBins().EncodeProb(prob) << BackoffBins().Bits()) | BackoffBins().EncodeBackoff(backoff)); } private: const Bins &ProbBins() const { return bins_[0]; } const Bins &BackoffBins() const { return bins_[1]; } const Bins *bins_; util::BitAddress address_; }; class LongestPointer { public: LongestPointer(const SeparatelyQuantize &quant, const util::BitAddress &address) : table_(&quant.LongestTable()), address_(address) {} LongestPointer() : address_(NULL, 0) {} bool Found() const { return address_.base != NULL; } void Write(float prob) const { util::WriteInt25(address_.base, address_.offset, table_->Bits(), table_->EncodeProb(prob)); } float Prob() const { return table_->Decode(util::ReadInt25(address_.base, address_.offset, table_->Bits(), table_->Mask())); } private: const Bins *table_; util::BitAddress address_; }; SeparatelyQuantize() 
{}

    void SetupMemory(void *start, unsigned char order, const Config &config);

    static const bool kTrain = true;
    // Assumes 0.0 is removed from backoff.
    void Train(uint8_t order, std::vector<float> &prob, std::vector<float> &backoff);
    // Train just probabilities (for longest order).
    void TrainProb(uint8_t order, std::vector<float> &prob);

    void FinishedLoading(const Config &config);

    const Bins *GetTables(unsigned char order_minus_2) const { return tables_[order_minus_2]; }

    const Bins &LongestTable() const { return longest_; }

  private:
    Bins tables_[KENLM_MAX_ORDER - 1][2];
    Bins longest_;

    uint8_t *actual_base_;

    uint8_t prob_bits_, backoff_bits_;
};

} // namespace ngram
} // namespace lm

#endif // LM_QUANTIZE_H__


================================================
FILE: src/kenlm/lm/query_main.cc
================================================
#include "lm/ngram_query.hh"

int main(int argc, char *argv[]) {
  if (!(argc == 2 || (argc == 3 && !strcmp(argv[2], "null")))) {
    std::cerr << "KenLM was compiled with maximum order " << KENLM_MAX_ORDER << "." << std::endl;
    std::cerr << "Usage: " << argv[0] << " lm_file [null]" << std::endl;
    std::cerr << "Input is wrapped in <s> and </s> unless null is passed." << std::endl;
    return 1;
  }
  try {
    bool sentence_context = (argc == 2);
    using namespace lm::ngram;
    ModelType model_type;
    if (RecognizeBinary(argv[1], model_type)) {
      switch(model_type) {
        case PROBING:
          Query<ProbingModel>(argv[1], sentence_context, std::cin, std::cout);
          break;
        case REST_PROBING:
          Query<RestProbingModel>(argv[1], sentence_context, std::cin, std::cout);
          break;
        case TRIE:
          Query<TrieModel>(argv[1], sentence_context, std::cin, std::cout);
          break;
        case QUANT_TRIE:
          Query<QuantTrieModel>(argv[1], sentence_context, std::cin, std::cout);
          break;
        case ARRAY_TRIE:
          Query<ArrayTrieModel>(argv[1], sentence_context, std::cin, std::cout);
          break;
        case QUANT_ARRAY_TRIE:
          Query<QuantArrayTrieModel>(argv[1], sentence_context, std::cin, std::cout);
          break;
        default:
          std::cerr << "Unrecognized kenlm model type " << model_type << std::endl;
          abort();
      }
    } else {
      Query<ProbingModel>(argv[1], sentence_context, std::cin, std::cout);
    }
    std::cerr << "Total time including destruction:\n";
    util::PrintUsage(std::cerr);
  } catch (const std::exception &e) {
    std::cerr << e.what() << std::endl;
    return 1;
  }
  return 0;
}


================================================
FILE: src/kenlm/lm/read_arpa.cc
================================================
#include "lm/read_arpa.hh"

#include "lm/blank.hh"
#include "util/file.hh"

#include
#include
#include
#include
#include
#include
#include
#include

#ifdef WIN32
#include <float.h>
#endif

namespace lm {

// 1 for '\t', '\n', and ' '. This is stricter than isspace.
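// A 256-entry table indexed by character code: only '\t' (9), '\n' (10), and ' ' (32)
// are marked, so ReadDelimited splits ARPA fields on exactly these characters and
// treats other whitespace (e.g. carriage return) as part of the token.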
const bool kARPASpaces[256] = {0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0}; namespace { bool IsEntirelyWhiteSpace(const StringPiece &line) { for (size_t i = 0; i < static_cast(line.size()); ++i) { if (!isspace(line.data()[i])) return false; } return true; } const char kBinaryMagic[] = "mmap lm http://kheafield.com/code"; // strtoull isn't portable enough :-( uint64_t ReadCount(const std::string &from) { std::stringstream stream(from); uint64_t ret; stream >> ret; UTIL_THROW_IF(!stream, FormatLoadException, "Bad count " << from); return ret; } } // namespace void ReadARPACounts(util::FilePiece &in, std::vector &number) { number.clear(); StringPiece line = in.ReadLine(); // In general, ARPA files can have arbitrary text before "\data\" // But in KenLM, we require such lines to start with "#", so that // we can do stricter error checking while (IsEntirelyWhiteSpace(line) || line.starts_with("#")) { line = in.ReadLine(); } if (line != "\\data\\") { if ((line.size() >= 2) && (line.data()[0] == 0x1f) && (static_cast(line.data()[1]) == 0x8b)) { UTIL_THROW(FormatLoadException, "Looks like a gzip file. If this is an ARPA file, pipe " << in.FileName() << " through zcat. If this already in binary format, you need to decompress it because mmap doesn't work on top of gzip."); } if (static_cast(line.size()) >= strlen(kBinaryMagic) && StringPiece(line.data(), strlen(kBinaryMagic)) == kBinaryMagic) UTIL_THROW(FormatLoadException, "This looks like a binary file but got sent to the ARPA parser. Did you compress the binary file or pass a binary file where only ARPA files are accepted?"); UTIL_THROW_IF(line.size() >= 4 && StringPiece(line.data(), 4) == "blmt", FormatLoadException, "This looks like an IRSTLM binary file. Did you forget to pass --text yes to compile-lm?"); UTIL_THROW_IF(line == "iARPA", FormatLoadException, "This looks like an IRSTLM iARPA file. You need an ARPA file. Run\n compile-lm --text yes " << in.FileName() << " " << in.FileName() << ".arpa\nfirst."); UTIL_THROW(FormatLoadException, "first non-empty line was \"" << line << "\" not \\data\\."); } while (!IsEntirelyWhiteSpace(line = in.ReadLine())) { if (line.size() < 6 || strncmp(line.data(), "ngram ", 6)) UTIL_THROW(FormatLoadException, "count line \"" << line << "\"doesn't begin with \"ngram \""); // So strtol doesn't go off the end of line. 
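    // For a (hypothetical) count line "ngram 3=35617", remaining holds "3=35617":
    // strtol reads the order 3, end_ptr stops at '=', and ReadCount parses 35617.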
    std::string remaining(line.data() + 6, line.size() - 6);
    char *end_ptr;
    unsigned int length = std::strtol(remaining.c_str(), &end_ptr, 10);
    if ((end_ptr == remaining.c_str()) || (length - 1 != number.size()))
      UTIL_THROW(FormatLoadException, "ngram count lengths should be consecutive starting with 1: " << line);
    if (*end_ptr != '=')
      UTIL_THROW(FormatLoadException, "Expected = immediately following the first number in the count line " << line);
    ++end_ptr;
    number.push_back(ReadCount(end_ptr));
  }
}

void ReadNGramHeader(util::FilePiece &in, unsigned int length) {
  StringPiece line;
  while (IsEntirelyWhiteSpace(line = in.ReadLine())) {}
  std::stringstream expected;
  expected << '\\' << length << "-grams:";
  if (line != expected.str())
    UTIL_THROW(FormatLoadException, "Was expecting n-gram header " << expected.str() << " but got " << line << " instead");
}

void ReadBackoff(util::FilePiece &in, Prob &/*weights*/) {
  switch (in.get()) {
    case '\t':
      {
        float got = in.ReadFloat();
        if (got != 0.0)
          UTIL_THROW(FormatLoadException, "Non-zero backoff " << got << " provided for an n-gram that should have no backoff");
      }
      break;
    case '\n':
      break;
    default:
      UTIL_THROW(FormatLoadException, "Expected tab or newline for backoff");
  }
}

void ReadBackoff(util::FilePiece &in, float &backoff) {
  // Always make zero negative.
  // Negative zero means that no (n+1)-gram has this n-gram as context.
  // Therefore the hypothesis state can be shorter. Of course, many n-grams
  // are context for (n+1)-grams. An algorithm in the data structure will go
  // back and set the backoff to positive zero in these cases.
  switch (in.get()) {
    case '\t':
      backoff = in.ReadFloat();
      if (backoff == ngram::kExtensionBackoff) backoff = ngram::kNoExtensionBackoff;
      {
#ifdef WIN32
        int float_class = _fpclass(backoff);
        UTIL_THROW_IF(float_class == _FPCLASS_SNAN || float_class == _FPCLASS_QNAN || float_class == _FPCLASS_NINF || float_class == _FPCLASS_PINF, FormatLoadException, "Bad backoff " << backoff);
#else
        int float_class = std::fpclassify(backoff);
        UTIL_THROW_IF(float_class == FP_NAN || float_class == FP_INFINITE, FormatLoadException, "Bad backoff " << backoff);
#endif
      }
      UTIL_THROW_IF(in.get() != '\n', FormatLoadException, "Expected newline after backoff");
      break;
    case '\n':
      backoff = ngram::kNoExtensionBackoff;
      break;
    default:
      UTIL_THROW(FormatLoadException, "Expected tab or newline for backoff");
  }
}

void ReadEnd(util::FilePiece &in) {
  StringPiece line;
  do {
    line = in.ReadLine();
  } while (IsEntirelyWhiteSpace(line));
  if (line != "\\end\\")
    UTIL_THROW(FormatLoadException, "Expected \\end\\ but the ARPA file has " << line);
  try {
    while (true) {
      line = in.ReadLine();
      if (!IsEntirelyWhiteSpace(line))
        UTIL_THROW(FormatLoadException, "Trailing line " << line);
    }
  } catch (const util::EndOfFileException &e) {}
}

void PositiveProbWarn::Warn(float prob) {
  switch (action_) {
    case THROW_UP:
      UTIL_THROW(FormatLoadException, "Positive log probability " << prob << " in the model. This is a bug in IRSTLM; you can set config.positive_log_probability = SILENT or pass -i to build_binary to substitute 0.0 for the log probability. Error");
    case COMPLAIN:
      std::cerr << "There's a positive log probability " << prob << " in the ARPA file, probably because of a bug in IRSTLM. This and subsequent entries will be mapped to 0 log probability."
<< std::endl; action_ = SILENT; break; case SILENT: break; } } } // namespace lm ================================================ FILE: src/kenlm/lm/read_arpa.hh ================================================ #ifndef LM_READ_ARPA__ #define LM_READ_ARPA__ #include "lm/lm_exception.hh" #include "lm/word_index.hh" #include "lm/weights.hh" #include "util/file_piece.hh" #include #include #include namespace lm { void ReadARPACounts(util::FilePiece &in, std::vector &number); void ReadNGramHeader(util::FilePiece &in, unsigned int length); void ReadBackoff(util::FilePiece &in, Prob &weights); void ReadBackoff(util::FilePiece &in, float &backoff); inline void ReadBackoff(util::FilePiece &in, ProbBackoff &weights) { ReadBackoff(in, weights.backoff); } inline void ReadBackoff(util::FilePiece &in, RestWeights &weights) { ReadBackoff(in, weights.backoff); } void ReadEnd(util::FilePiece &in); extern const bool kARPASpaces[256]; // Positive log probability warning. class PositiveProbWarn { public: PositiveProbWarn() : action_(THROW_UP) {} explicit PositiveProbWarn(WarningAction action) : action_(action) {} void Warn(float prob); private: WarningAction action_; }; template void Read1Gram(util::FilePiece &f, Voc &vocab, Weights *unigrams, PositiveProbWarn &warn) { try { float prob = f.ReadFloat(); if (prob > 0.0) { warn.Warn(prob); prob = 0.0; } if (f.get() != '\t') UTIL_THROW(FormatLoadException, "Expected tab after probability"); Weights &value = unigrams[vocab.Insert(f.ReadDelimited(kARPASpaces))]; value.prob = prob; ReadBackoff(f, value); } catch(util::Exception &e) { e << " in the 1-gram at byte " << f.Offset(); throw; } } // Return true if a positive log probability came out. template void Read1Grams(util::FilePiece &f, std::size_t count, Voc &vocab, Weights *unigrams, PositiveProbWarn &warn) { ReadNGramHeader(f, 1); for (std::size_t i = 0; i < count; ++i) { Read1Gram(f, vocab, unigrams, warn); } vocab.FinishedLoading(unigrams); } // Return true if a positive log probability came out. template void ReadNGram(util::FilePiece &f, const unsigned char n, const Voc &vocab, WordIndex *const reverse_indices, Weights &weights, PositiveProbWarn &warn) { try { weights.prob = f.ReadFloat(); if (weights.prob > 0.0) { warn.Warn(weights.prob); weights.prob = 0.0; } for (WordIndex *vocab_out = reverse_indices + n - 1; vocab_out >= reverse_indices; --vocab_out) { *vocab_out = vocab.Index(f.ReadDelimited(kARPASpaces)); } ReadBackoff(f, weights); } catch(util::Exception &e) { e << " in the " << static_cast(n) << "-gram at byte " << f.Offset(); throw; } } } // namespace lm #endif // LM_READ_ARPA__ ================================================ FILE: src/kenlm/lm/return.hh ================================================ #ifndef LM_RETURN__ #define LM_RETURN__ #include namespace lm { /* Structure returned by scoring routines. */ struct FullScoreReturn { // log10 probability float prob; /* The length of n-gram matched. Do not use this for recombination. * Consider a model containing only the following n-grams: * -1 foo * -3.14 bar * -2.718 baz -5 * -6 foo bar * * If you score ``bar'' then ngram_length is 1 and recombination state is the * empty string because bar has zero backoff and does not extend to the * right. * If you score ``foo'' then ngram_length is 1 and recombination state is * ``foo''. * * Ideally, keep output states around and compare them. Failing that, * get out_state.ValidLength() and use that length for recombination. */ unsigned char ngram_length; /* Left extension information. 
If independent_left is set, then prob is * independent of words to the left (up to additional backoff). Otherwise, * extend_left indicates how to efficiently extend further to the left. */ bool independent_left; uint64_t extend_left; // Defined only if independent_left // Rest cost for extension to the left. float rest; }; } // namespace lm #endif // LM_RETURN__ ================================================ FILE: src/kenlm/lm/search_hashed.cc ================================================ #include "lm/search_hashed.hh" #include "lm/binary_format.hh" #include "lm/blank.hh" #include "lm/lm_exception.hh" #include "lm/model.hh" #include "lm/read_arpa.hh" #include "lm/value.hh" #include "lm/vocab.hh" #include "util/bit_packing.hh" #include "util/file_piece.hh" #include namespace lm { namespace ngram { class ProbingModel; namespace { /* These are passed to ReadNGrams so that n-grams with zero backoff that appear as context will still be used in state. */ template class ActivateLowerMiddle { public: explicit ActivateLowerMiddle(Middle &middle) : modify_(middle) {} void operator()(const WordIndex *vocab_ids, const unsigned int n) { uint64_t hash = static_cast(vocab_ids[1]); for (const WordIndex *i = vocab_ids + 2; i < vocab_ids + n; ++i) { hash = detail::CombineWordHash(hash, *i); } typename Middle::MutableIterator i; // TODO: somehow get text of n-gram for this error message. if (!modify_.UnsafeMutableFind(hash, i)) UTIL_THROW(FormatLoadException, "The context of every " << n << "-gram should appear as a " << (n-1) << "-gram"); SetExtension(i->value.backoff); } private: Middle &modify_; }; template class ActivateUnigram { public: explicit ActivateUnigram(Weights *unigram) : modify_(unigram) {} void operator()(const WordIndex *vocab_ids, const unsigned int /*n*/) { // assert(n == 2); SetExtension(modify_[vocab_ids[1]].backoff); } private: Weights *modify_; }; // Find the lower order entry, inserting blanks along the way as necessary. template void FindLower( const std::vector &keys, typename Value::Weights &unigram, std::vector > &middle, std::vector &between) { typename util::ProbingHashTable::MutableIterator iter; typename Value::ProbingEntry entry; // Backoff will always be 0.0. We'll get the probability and rest in another pass. entry.value.backoff = kNoExtensionBackoff; // Go back and find the longest right-aligned entry, informing it that it extends left. Normally this will match immediately, but sometimes SRI is dumb. for (int lower = keys.size() - 2; ; --lower) { if (lower == -1) { between.push_back(&unigram); return; } entry.key = keys[lower]; bool found = middle[lower].FindOrInsert(entry, iter); between.push_back(&iter->value); if (found) return; } } // Between usually has single entry, the value to adjust. But sometimes SRI stupidly pruned entries so it has unitialized blank values to be set here. template void AdjustLower( const Added &added, const Build &build, std::vector &between, const unsigned int n, const std::vector &vocab_ids, typename Build::Value::Weights *unigrams, std::vector > &middle) { typedef typename Build::Value Value; if (between.size() == 1) { build.MarkExtends(*between.front(), added); return; } typedef util::ProbingHashTable Middle; float prob = -fabs(between.back()->prob); // Order of the n-gram on which probabilities are based. unsigned char basis = n - between.size(); assert(basis != 0); typename Build::Value::Weights **change = &between.back(); // Skip the basis. 
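  // change now walks upward from the basis entry toward the longest pruned entry,
  // giving each blank the basis probability plus the accumulated context backoffs,
  // i.e. the score a backed-off query would have produced.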
--change; if (basis == 1) { // Hallucinate a bigram based on a unigram's backoff and a unigram probability. float &backoff = unigrams[vocab_ids[1]].backoff; SetExtension(backoff); prob += backoff; (*change)->prob = prob; build.SetRest(&*vocab_ids.begin(), 2, **change); basis = 2; --change; } uint64_t backoff_hash = static_cast(vocab_ids[1]); for (unsigned char i = 2; i <= basis; ++i) { backoff_hash = detail::CombineWordHash(backoff_hash, vocab_ids[i]); } for (; basis < n - 1; ++basis, --change) { typename Middle::MutableIterator gotit; if (middle[basis - 2].UnsafeMutableFind(backoff_hash, gotit)) { float &backoff = gotit->value.backoff; SetExtension(backoff); prob += backoff; } (*change)->prob = prob; build.SetRest(&*vocab_ids.begin(), basis + 1, **change); backoff_hash = detail::CombineWordHash(backoff_hash, vocab_ids[basis+1]); } typename std::vector::const_iterator i(between.begin()); build.MarkExtends(**i, added); const typename Value::Weights *longer = *i; // Everything has probability but is not marked as extending. for (++i; i != between.end(); ++i) { build.MarkExtends(**i, *longer); longer = *i; } } // Continue marking lower entries even they know that they extend left. This is used for upper/lower bounds. template void MarkLower( const std::vector &keys, const Build &build, typename Build::Value::Weights &unigram, std::vector > &middle, int start_order, const typename Build::Value::Weights &longer) { if (start_order == 0) return; typename util::ProbingHashTable::MutableIterator iter; // Hopefully the compiler will realize that if MarkExtends always returns false, it can simplify this code. for (int even_lower = start_order - 2 /* index in middle */; ; --even_lower) { if (even_lower == -1) { build.MarkExtends(unigram, longer); return; } middle[even_lower].UnsafeMutableFind(keys[even_lower], iter); if (!build.MarkExtends(iter->value, longer)) return; } } template void ReadNGrams( util::FilePiece &f, const unsigned int n, const size_t count, const ProbingVocabulary &vocab, const Build &build, typename Build::Value::Weights *unigrams, std::vector > &middle, Activate activate, Store &store, PositiveProbWarn &warn) { typedef typename Build::Value Value; typedef util::ProbingHashTable Middle; assert(n >= 2); ReadNGramHeader(f, n); // Both vocab_ids and keys are non-empty because n >= 2. // vocab ids of words in reverse order. std::vector vocab_ids(n); std::vector keys(n-1); typename Store::Entry entry; std::vector between; for (size_t i = 0; i < count; ++i) { ReadNGram(f, n, vocab, &*vocab_ids.begin(), entry.value, warn); build.SetRest(&*vocab_ids.begin(), n, entry.value); keys[0] = detail::CombineWordHash(static_cast(vocab_ids.front()), vocab_ids[1]); for (unsigned int h = 1; h < n - 1; ++h) { keys[h] = detail::CombineWordHash(keys[h-1], vocab_ids[h+1]); } // Initially the sign bit is on, indicating it does not extend left. Most already have this but there might +0.0. 
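    // SetSign turns the sign bit on (so even +0.0 becomes -0.0); if a longer n-gram
    // later uses this entry as context, MarkExtends clears the flag again.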
util::SetSign(entry.value.prob); entry.key = keys[n-2]; store.Insert(entry); between.clear(); FindLower(keys, unigrams[vocab_ids.front()], middle, between); AdjustLower(entry.value, build, between, n, vocab_ids, unigrams, middle); if (Build::kMarkEvenLower) MarkLower(keys, build, unigrams[vocab_ids.front()], middle, n - between.size() - 1, *between.back()); activate(&*vocab_ids.begin(), n); } store.FinishedInserting(); } } // namespace namespace detail { template uint8_t *HashedSearch::SetupMemory(uint8_t *start, const std::vector &counts, const Config &config) { std::size_t allocated = Unigram::Size(counts[0]); unigram_ = Unigram(start, counts[0], allocated); start += allocated; for (unsigned int n = 2; n < counts.size(); ++n) { allocated = Middle::Size(counts[n - 1], config.probing_multiplier); middle_.push_back(Middle(start, allocated)); start += allocated; } allocated = Longest::Size(counts.back(), config.probing_multiplier); longest_ = Longest(start, allocated); start += allocated; return start; } template void HashedSearch::InitializeFromARPA(const char * /*file*/, util::FilePiece &f, const std::vector &counts, const Config &config, ProbingVocabulary &vocab, Backing &backing) { // TODO: fix sorted. SetupMemory(GrowForSearch(config, vocab.UnkCountChangePadding(), Size(counts, config), backing), counts, config); PositiveProbWarn warn(config.positive_log_probability); Read1Grams(f, counts[0], vocab, unigram_.Raw(), warn); CheckSpecials(config, vocab); DispatchBuild(f, counts, config, vocab, warn); } template <> void HashedSearch::DispatchBuild(util::FilePiece &f, const std::vector &counts, const Config &config, const ProbingVocabulary &vocab, PositiveProbWarn &warn) { NoRestBuild build; ApplyBuild(f, counts, vocab, warn, build); } template <> void HashedSearch::DispatchBuild(util::FilePiece &f, const std::vector &counts, const Config &config, const ProbingVocabulary &vocab, PositiveProbWarn &warn) { switch (config.rest_function) { case Config::REST_MAX: { MaxRestBuild build; ApplyBuild(f, counts, vocab, warn, build); } break; case Config::REST_LOWER: { LowerRestBuild build(config, counts.size(), vocab); ApplyBuild(f, counts, vocab, warn, build); } break; } } template template void HashedSearch::ApplyBuild(util::FilePiece &f, const std::vector &counts, const ProbingVocabulary &vocab, PositiveProbWarn &warn, const Build &build) { for (WordIndex i = 0; i < counts[0]; ++i) { build.SetRest(&i, (unsigned int)1, unigram_.Raw()[i]); } try { if (counts.size() > 2) { ReadNGrams, Middle>( f, 2, counts[1], vocab, build, unigram_.Raw(), middle_, ActivateUnigram(unigram_.Raw()), middle_[0], warn); } for (unsigned int n = 3; n < counts.size(); ++n) { ReadNGrams, Middle>( f, n, counts[n-1], vocab, build, unigram_.Raw(), middle_, ActivateLowerMiddle(middle_[n-3]), middle_[n-2], warn); } if (counts.size() > 2) { ReadNGrams, Longest>( f, counts.size(), counts[counts.size() - 1], vocab, build, unigram_.Raw(), middle_, ActivateLowerMiddle(middle_.back()), longest_, warn); } else { ReadNGrams, Longest>( f, counts.size(), counts[counts.size() - 1], vocab, build, unigram_.Raw(), middle_, ActivateUnigram(unigram_.Raw()), longest_, warn); } } catch (util::ProbingSizeException &e) { UTIL_THROW(util::ProbingSizeException, "Avoid pruning n-grams like \"bar baz quux\" when \"foo bar baz quux\" is still in the model. KenLM will work when this pruning happens, but the probing model assumes these events are rare enough that using blank space in the probing hash table will cover all of them. 
Increase probing_multiplier (-p to build_binary) to add more blank spaces.\n"); } ReadEnd(f); } template void HashedSearch::LoadedBinary() { unigram_.LoadedBinary(); for (typename std::vector::iterator i = middle_.begin(); i != middle_.end(); ++i) { i->LoadedBinary(); } longest_.LoadedBinary(); } template class HashedSearch; template class HashedSearch; } // namespace detail } // namespace ngram } // namespace lm ================================================ FILE: src/kenlm/lm/search_hashed.hh ================================================ #ifndef LM_SEARCH_HASHED__ #define LM_SEARCH_HASHED__ #include "lm/model_type.hh" #include "lm/config.hh" #include "lm/read_arpa.hh" #include "lm/return.hh" #include "lm/weights.hh" #include "util/bit_packing.hh" #include "util/probing_hash_table.hh" #include #include #include namespace util { class FilePiece; } namespace lm { namespace ngram { struct Backing; class ProbingVocabulary; namespace detail { inline uint64_t CombineWordHash(uint64_t current, const WordIndex next) { uint64_t ret = (current * 8978948897894561157ULL) ^ (static_cast(1 + next) * 17894857484156487943ULL); return ret; } #pragma pack(push) #pragma pack(4) struct ProbEntry { uint64_t key; Prob value; typedef uint64_t Key; typedef Prob Value; uint64_t GetKey() const { return key; } }; #pragma pack(pop) class LongestPointer { public: explicit LongestPointer(const float &to) : to_(&to) {} LongestPointer() : to_(NULL) {} bool Found() const { return to_ != NULL; } float Prob() const { return *to_; } private: const float *to_; }; template class HashedSearch { public: typedef uint64_t Node; typedef typename Value::ProbingProxy UnigramPointer; typedef typename Value::ProbingProxy MiddlePointer; typedef ::lm::ngram::detail::LongestPointer LongestPointer; static const ModelType kModelType = Value::kProbingModelType; static const bool kDifferentRest = Value::kDifferentRest; static const unsigned int kVersion = 0; // TODO: move probing_multiplier here with next binary file format update. 
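  // Query flow: LookupUnigram starts the Node, LookupMiddle extends it one context
  // word at a time via CombineWordHash, and LookupLongest probes the full-order
  // table; the unigram and middle lookups also report whether the entry can still
  // be extended to the left.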
static void UpdateConfigFromBinary(int, const std::vector &, Config &) {} static uint64_t Size(const std::vector &counts, const Config &config) { uint64_t ret = Unigram::Size(counts[0]); for (unsigned char n = 1; n < counts.size() - 1; ++n) { ret += Middle::Size(counts[n], config.probing_multiplier); } return ret + Longest::Size(counts.back(), config.probing_multiplier); } uint8_t *SetupMemory(uint8_t *start, const std::vector &counts, const Config &config); void InitializeFromARPA(const char *file, util::FilePiece &f, const std::vector &counts, const Config &config, ProbingVocabulary &vocab, Backing &backing); void LoadedBinary(); unsigned char Order() const { return middle_.size() + 2; } typename Value::Weights &UnknownUnigram() { return unigram_.Unknown(); } UnigramPointer LookupUnigram(WordIndex word, Node &next, bool &independent_left, uint64_t &extend_left) const { extend_left = static_cast(word); next = extend_left; UnigramPointer ret(unigram_.Lookup(word)); independent_left = ret.IndependentLeft(); return ret; } #pragma GCC diagnostic ignored "-Wuninitialized" MiddlePointer Unpack(uint64_t extend_pointer, unsigned char extend_length, Node &node) const { node = extend_pointer; typename Middle::ConstIterator found; bool got = middle_[extend_length - 2].Find(extend_pointer, found); assert(got); (void)got; return MiddlePointer(found->value); } MiddlePointer LookupMiddle(unsigned char order_minus_2, WordIndex word, Node &node, bool &independent_left, uint64_t &extend_pointer) const { node = CombineWordHash(node, word); typename Middle::ConstIterator found; if (!middle_[order_minus_2].Find(node, found)) { independent_left = true; return MiddlePointer(); } extend_pointer = node; MiddlePointer ret(found->value); independent_left = ret.IndependentLeft(); return ret; } LongestPointer LookupLongest(WordIndex word, const Node &node) const { // Sign bit is always on because longest n-grams do not extend left. typename Longest::ConstIterator found; if (!longest_.Find(CombineWordHash(node, word), found)) return LongestPointer(); return LongestPointer(found->value.prob); } // Generate a node without necessarily checking that it actually exists. // Optionally return false if it's know to not exist. bool FastMakeNode(const WordIndex *begin, const WordIndex *end, Node &node) const { assert(begin != end); node = static_cast(*begin); for (const WordIndex *i = begin + 1; i < end; ++i) { node = CombineWordHash(node, *i); } return true; } private: // Interpret config's rest cost build policy and pass the right template argument to ApplyBuild. void DispatchBuild(util::FilePiece &f, const std::vector &counts, const Config &config, const ProbingVocabulary &vocab, PositiveProbWarn &warn); template void ApplyBuild(util::FilePiece &f, const std::vector &counts, const ProbingVocabulary &vocab, PositiveProbWarn &warn, const Build &build); class Unigram { public: Unigram() {} Unigram(void *start, uint64_t count, std::size_t /*allocated*/) : unigram_(static_cast(start)) #ifdef DEBUG , count_(count) #endif {} static uint64_t Size(uint64_t count) { return (count + 1) * sizeof(typename Value::Weights); // +1 for hallucinate } const typename Value::Weights &Lookup(WordIndex index) const { #ifdef DEBUG assert(index < count_); #endif return unigram_[index]; } typename Value::Weights &Unknown() { return unigram_[0]; } void LoadedBinary() {} // For building. 
typename Value::Weights *Raw() { return unigram_; } private: typename Value::Weights *unigram_; #ifdef DEBUG uint64_t count_; #endif }; Unigram unigram_; typedef util::ProbingHashTable Middle; std::vector middle_; typedef util::ProbingHashTable Longest; Longest longest_; }; } // namespace detail } // namespace ngram } // namespace lm #endif // LM_SEARCH_HASHED__ ================================================ FILE: src/kenlm/lm/search_trie.cc ================================================ /* This is where the trie is built. It's on-disk. */ #include "lm/search_trie.hh" #include "lm/bhiksha.hh" #include "lm/binary_format.hh" #include "lm/blank.hh" #include "lm/lm_exception.hh" #include "lm/max_order.hh" #include "lm/quantize.hh" #include "lm/trie.hh" #include "lm/trie_sort.hh" #include "lm/vocab.hh" #include "lm/weights.hh" #include "lm/word_index.hh" #include "util/ersatz_progress.hh" #include "util/mmap.hh" #include "util/proxy_iterator.hh" #include "util/scoped.hh" #include "util/sized_iterator.hh" #include #include #include #include #include #include #include #include #if defined(_WIN32) || defined(_WIN64) #include #endif namespace lm { namespace ngram { namespace trie { namespace { void ReadOrThrow(FILE *from, void *data, size_t size) { UTIL_THROW_IF(1 != std::fread(data, size, 1, from), util::ErrnoException, "Short read"); } int Compare(unsigned char order, const void *first_void, const void *second_void) { const WordIndex *first = reinterpret_cast(first_void), *second = reinterpret_cast(second_void); const WordIndex *end = first + order; for (; first != end; ++first, ++second) { if (*first < *second) return -1; if (*first > *second) return 1; } return 0; } struct ProbPointer { unsigned char array; uint64_t index; }; // Array of n-grams and float indices. class BackoffMessages { public: void Init(std::size_t entry_size) { current_ = NULL; allocated_ = NULL; entry_size_ = entry_size; } void Add(const WordIndex *to, ProbPointer index) { while (current_ + entry_size_ > allocated_) { std::size_t allocated_size = allocated_ - (uint8_t*)backing_.get(); Resize(std::max(allocated_size * 2, entry_size_)); } memcpy(current_, to, entry_size_ - sizeof(ProbPointer)); *reinterpret_cast(current_ + entry_size_ - sizeof(ProbPointer)) = index; current_ += entry_size_; } void Apply(float *const *const base, FILE *unigrams) { FinishedAdding(); if (current_ == allocated_) return; rewind(unigrams); ProbBackoff weights; WordIndex unigram = 0; ReadOrThrow(unigrams, &weights, sizeof(weights)); for (; current_ != allocated_; current_ += entry_size_) { const WordIndex &cur_word = *reinterpret_cast(current_); for (; unigram < cur_word; ++unigram) { ReadOrThrow(unigrams, &weights, sizeof(weights)); } if (!HasExtension(weights.backoff)) { weights.backoff = kExtensionBackoff; UTIL_THROW_IF(fseek(unigrams, -sizeof(weights), SEEK_CUR), util::ErrnoException, "Seeking backwards to denote unigram extension failed."); util::WriteOrThrow(unigrams, &weights, sizeof(weights)); } const ProbPointer &write_to = *reinterpret_cast(current_ + sizeof(WordIndex)); base[write_to.array][write_to.index] += weights.backoff; } backing_.reset(); } void Apply(float *const *const base, RecordReader &reader) { FinishedAdding(); if (current_ == allocated_) return; // We'll also use the same buffer to record messages to blanks that they extend. 
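    // Messages were sorted by FinishedAdding and the reader returns records in the
    // same order, so the loop below is a merge: -1 advances the reader, 1 records a
    // message whose receiver was pruned away (a blank that extends right), and 0 adds
    // the record's backoff to the waiting probability (or just marks a zero backoff
    // as extending).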
WordIndex *extend_out = reinterpret_cast(current_); const unsigned char order = (entry_size_ - sizeof(ProbPointer)) / sizeof(WordIndex); for (reader.Rewind(); reader && (current_ != allocated_); ) { switch (Compare(order, reader.Data(), current_)) { case -1: ++reader; break; case 1: // Message but nobody to receive it. Write it down at the beginning of the buffer so we can inform this blank that it extends. for (const WordIndex *w = reinterpret_cast(current_); w != reinterpret_cast(current_) + order; ++w, ++extend_out) *extend_out = *w; current_ += entry_size_; break; case 0: float &backoff = reinterpret_cast((uint8_t*)reader.Data() + order * sizeof(WordIndex))->backoff; if (!HasExtension(backoff)) { backoff = kExtensionBackoff; reader.Overwrite(&backoff, sizeof(float)); } else { const ProbPointer &write_to = *reinterpret_cast(current_ + entry_size_ - sizeof(ProbPointer)); base[write_to.array][write_to.index] += backoff; } current_ += entry_size_; break; } } // Now this is a list of blanks that extend right. entry_size_ = sizeof(WordIndex) * order; Resize(sizeof(WordIndex) * (extend_out - (const WordIndex*)backing_.get())); current_ = (uint8_t*)backing_.get(); } // Call after Apply bool Extends(unsigned char order, const WordIndex *words) { if (current_ == allocated_) return false; assert(order * sizeof(WordIndex) == entry_size_); while (true) { switch(Compare(order, words, current_)) { case 1: current_ += entry_size_; if (current_ == allocated_) return false; break; case -1: return false; case 0: return true; } } } private: void FinishedAdding() { Resize(current_ - (uint8_t*)backing_.get()); // Sort requests in same order as files. std::sort( util::SizedIterator(util::SizedProxy(backing_.get(), entry_size_)), util::SizedIterator(util::SizedProxy(current_, entry_size_)), util::SizedCompare(EntryCompare((entry_size_ - sizeof(ProbPointer)) / sizeof(WordIndex)))); current_ = (uint8_t*)backing_.get(); } void Resize(std::size_t to) { std::size_t current = current_ - (uint8_t*)backing_.get(); backing_.call_realloc(to); current_ = (uint8_t*)backing_.get() + current; allocated_ = (uint8_t*)backing_.get() + to; } util::scoped_malloc backing_; uint8_t *current_, *allocated_; std::size_t entry_size_; }; const float kBadProb = std::numeric_limits::infinity(); class SRISucks { public: SRISucks() { for (BackoffMessages *i = messages_; i != messages_ + KENLM_MAX_ORDER - 1; ++i) i->Init(sizeof(ProbPointer) + sizeof(WordIndex) * (i - messages_ + 1)); } void Send(unsigned char begin, unsigned char order, const WordIndex *to, float prob_basis) { assert(prob_basis != kBadProb); ProbPointer pointer; pointer.array = order - 1; pointer.index = values_[order - 1].size(); for (unsigned char i = begin; i < order; ++i) { messages_[i - 1].Add(to, pointer); } values_[order - 1].push_back(prob_basis); } void ObtainBackoffs(unsigned char total_order, FILE *unigram_file, RecordReader *reader) { for (unsigned char i = 0; i < KENLM_MAX_ORDER - 1; ++i) { it_[i] = values_[i].empty() ? NULL : &*values_[i].begin(); } messages_[0].Apply(it_, unigram_file); BackoffMessages *messages = messages_ + 1; const RecordReader *end = reader + total_order - 2 /* exclude unigrams and longest order */; for (; reader != end; ++messages, ++reader) { messages->Apply(it_, *reader); } } ProbBackoff GetBlank(unsigned char total_order, unsigned char order, const WordIndex *indices) { assert(order > 1); ProbBackoff ret; ret.prob = *(it_[order - 1]++); ret.backoff = ((order != total_order - 1) && messages_[order - 1].Extends(order, indices)) ? 
kExtensionBackoff : kNoExtensionBackoff; return ret; } const std::vector &Values(unsigned char order) const { return values_[order - 1]; } private: // This used to be one array. Then I needed to separate it by order for quantization to work. std::vector values_[KENLM_MAX_ORDER - 1]; BackoffMessages messages_[KENLM_MAX_ORDER - 1]; float *it_[KENLM_MAX_ORDER - 1]; }; class FindBlanks { public: FindBlanks(unsigned char order, const ProbBackoff *unigrams, SRISucks &messages) : counts_(order), unigrams_(unigrams), sri_(messages) {} float UnigramProb(WordIndex index) const { return unigrams_[index].prob; } void Unigram(WordIndex /*index*/) { ++counts_[0]; } void MiddleBlank(const unsigned char order, const WordIndex *indices, unsigned char lower, float prob_basis) { sri_.Send(lower, order, indices + 1, prob_basis); ++counts_[order - 1]; } void Middle(const unsigned char order, const void * /*data*/) { ++counts_[order - 1]; } void Longest(const void * /*data*/) { ++counts_.back(); } // Unigrams wrote one past. void Cleanup() { --counts_[0]; } const std::vector &Counts() const { return counts_; } private: std::vector counts_; const ProbBackoff *unigrams_; SRISucks &sri_; }; // Phase to actually write n-grams to the trie. template class WriteEntries { public: WriteEntries(RecordReader *contexts, const Quant &quant, UnigramValue *unigrams, BitPackedMiddle *middle, BitPackedLongest &longest, unsigned char order, SRISucks &sri) : contexts_(contexts), quant_(quant), unigrams_(unigrams), middle_(middle), longest_(longest), bigram_pack_((order == 2) ? static_cast(longest_) : static_cast(*middle_)), order_(order), sri_(sri) {} float UnigramProb(WordIndex index) const { return unigrams_[index].weights.prob; } void Unigram(WordIndex word) { unigrams_[word].next = bigram_pack_.InsertIndex(); } void MiddleBlank(const unsigned char order, const WordIndex *indices, unsigned char /*lower*/, float /*prob_base*/) { ProbBackoff weights = sri_.GetBlank(order_, order, indices); typename Quant::MiddlePointer(quant_, order - 2, middle_[order - 2].Insert(indices[order - 1])).Write(weights.prob, weights.backoff); } void Middle(const unsigned char order, const void *data) { RecordReader &context = contexts_[order - 1]; const WordIndex *words = reinterpret_cast(data); ProbBackoff weights = *reinterpret_cast(words + order); if (context && !memcmp(data, context.Data(), sizeof(WordIndex) * order)) { SetExtension(weights.backoff); ++context; } typename Quant::MiddlePointer(quant_, order - 2, middle_[order - 2].Insert(words[order - 1])).Write(weights.prob, weights.backoff); } void Longest(const void *data) { const WordIndex *words = reinterpret_cast(data); typename Quant::LongestPointer(quant_, longest_.Insert(words[order_ - 1])).Write(reinterpret_cast(words + order_)->prob); } void Cleanup() {} private: RecordReader *contexts_; const Quant &quant_; UnigramValue *const unigrams_; BitPackedMiddle *const middle_; BitPackedLongest &longest_; BitPacked &bigram_pack_; const unsigned char order_; SRISucks &sri_; }; struct Gram { Gram(const WordIndex *in_begin, unsigned char order) : begin(in_begin), end(in_begin + order) {} const WordIndex *begin, *end; // For queue, this is the direction we want. 
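  // Note the reversed comparison (other before *this): std::priority_queue is a
  // max-heap, so this makes RecursiveInsert pop the lexicographically smallest
  // n-gram first.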
bool operator<(const Gram &other) const { return std::lexicographical_compare(other.begin, other.end, begin, end); } }; template class BlankManager { public: BlankManager(unsigned char total_order, Doing &doing) : total_order_(total_order), been_length_(0), doing_(doing) { for (float *i = basis_; i != basis_ + KENLM_MAX_ORDER - 1; ++i) *i = kBadProb; } void Visit(const WordIndex *to, unsigned char length, float prob) { basis_[length - 1] = prob; unsigned char overlap = std::min(length - 1, been_length_); const WordIndex *cur; WordIndex *pre; for (cur = to, pre = been_; cur != to + overlap; ++cur, ++pre) { if (*pre != *cur) break; } if (cur == to + length - 1) { *pre = *cur; been_length_ = length; return; } // There are blanks to insert starting with order blank. unsigned char blank = cur - to + 1; UTIL_THROW_IF(blank == 1, FormatLoadException, "Missing a unigram that appears as context."); const float *lower_basis; for (lower_basis = basis_ + blank - 2; *lower_basis == kBadProb; --lower_basis) {} unsigned char based_on = lower_basis - basis_ + 1; for (; cur != to + length - 1; ++blank, ++cur, ++pre) { assert(*lower_basis != kBadProb); doing_.MiddleBlank(blank, to, based_on, *lower_basis); *pre = *cur; // Mark that the probability is a blank so it shouldn't be used as the basis for a later n-gram. basis_[blank - 1] = kBadProb; } *pre = *cur; been_length_ = length; } private: const unsigned char total_order_; WordIndex been_[KENLM_MAX_ORDER]; unsigned char been_length_; float basis_[KENLM_MAX_ORDER]; Doing &doing_; }; template void RecursiveInsert(const unsigned char total_order, const WordIndex unigram_count, RecordReader *input, std::ostream *progress_out, const char *message, Doing &doing) { util::ErsatzProgress progress(unigram_count + 1, progress_out, message); WordIndex unigram = 0; std::priority_queue grams; grams.push(Gram(&unigram, 1)); for (unsigned char i = 2; i <= total_order; ++i) { if (input[i-2]) grams.push(Gram(reinterpret_cast(input[i-2].Data()), i)); } BlankManager blank(total_order, doing); while (true) { Gram top = grams.top(); grams.pop(); unsigned char order = top.end - top.begin; if (order == 1) { blank.Visit(&unigram, 1, doing.UnigramProb(unigram)); doing.Unigram(unigram); progress.Set(unigram); if (++unigram == unigram_count + 1) break; grams.push(top); } else { if (order == total_order) { blank.Visit(top.begin, order, reinterpret_cast(top.end)->prob); doing.Longest(top.begin); } else { blank.Visit(top.begin, order, reinterpret_cast(top.end)->prob); doing.Middle(order, top.begin); } RecordReader &reader = input[order - 2]; if (++reader) grams.push(top); } } assert(grams.empty()); doing.Cleanup(); } void SanityCheckCounts(const std::vector &initial, const std::vector &fixed) { if (fixed[0] != initial[0]) UTIL_THROW(util::Exception, "Unigram count should be constant but initial is " << initial[0] << " and recounted is " << fixed[0]); if (fixed.back() != initial.back()) UTIL_THROW(util::Exception, "Longest count should be constant but it changed from " << initial.back() << " to " << fixed.back()); for (unsigned char i = 0; i < initial.size(); ++i) { if (fixed[i] < initial[i]) UTIL_THROW(util::Exception, "Counts came out lower than expected. 
This shouldn't happen"); } } template void TrainQuantizer(uint8_t order, uint64_t count, const std::vector &additional, RecordReader &reader, util::ErsatzProgress &progress, Quant &quant) { std::vector probs(additional), backoffs; probs.reserve(count + additional.size()); backoffs.reserve(count); for (reader.Rewind(); reader; ++reader) { const ProbBackoff &weights = *reinterpret_cast(reinterpret_cast(reader.Data()) + sizeof(WordIndex) * order); probs.push_back(weights.prob); if (weights.backoff != 0.0) backoffs.push_back(weights.backoff); ++progress; } quant.Train(order, probs, backoffs); } template void TrainProbQuantizer(uint8_t order, uint64_t count, RecordReader &reader, util::ErsatzProgress &progress, Quant &quant) { std::vector probs, backoffs; probs.reserve(count); for (reader.Rewind(); reader; ++reader) { const Prob &weights = *reinterpret_cast(reinterpret_cast(reader.Data()) + sizeof(WordIndex) * order); probs.push_back(weights.prob); ++progress; } quant.TrainProb(order, probs); } void PopulateUnigramWeights(FILE *file, WordIndex unigram_count, RecordReader &contexts, UnigramValue *unigrams) { // Fill unigram probabilities. try { rewind(file); for (WordIndex i = 0; i < unigram_count; ++i) { ReadOrThrow(file, &unigrams[i].weights, sizeof(ProbBackoff)); if (contexts && *reinterpret_cast(contexts.Data()) == i) { SetExtension(unigrams[i].weights.backoff); ++contexts; } } } catch (util::Exception &e) { e << " while re-reading unigram probabilities"; throw; } } } // namespace template void BuildTrie(SortedFiles &files, std::vector &counts, const Config &config, TrieSearch &out, Quant &quant, const SortedVocabulary &vocab, Backing &backing) { RecordReader inputs[KENLM_MAX_ORDER - 1]; RecordReader contexts[KENLM_MAX_ORDER - 1]; for (unsigned char i = 2; i <= counts.size(); ++i) { inputs[i-2].Init(files.Full(i), i * sizeof(WordIndex) + (i == counts.size() ? 
sizeof(Prob) : sizeof(ProbBackoff))); contexts[i-2].Init(files.Context(i), (i-1) * sizeof(WordIndex)); } SRISucks sri; std::vector fixed_counts; util::scoped_FILE unigram_file; util::scoped_fd unigram_fd(files.StealUnigram()); { util::scoped_memory unigrams; MapRead(util::POPULATE_OR_READ, unigram_fd.get(), 0, counts[0] * sizeof(ProbBackoff), unigrams); FindBlanks finder(counts.size(), reinterpret_cast(unigrams.get()), sri); RecursiveInsert(counts.size(), counts[0], inputs, config.ProgressMessages(), "Identifying n-grams omitted by SRI", finder); fixed_counts = finder.Counts(); } unigram_file.reset(util::FDOpenOrThrow(unigram_fd)); for (const RecordReader *i = inputs; i != inputs + counts.size() - 2; ++i) { if (*i) UTIL_THROW(FormatLoadException, "There's a bug in the trie implementation: the " << (i - inputs + 2) << "-gram table did not complete reading"); } SanityCheckCounts(counts, fixed_counts); counts = fixed_counts; sri.ObtainBackoffs(counts.size(), unigram_file.get(), inputs); out.SetupMemory(GrowForSearch(config, vocab.UnkCountChangePadding(), TrieSearch::Size(fixed_counts, config), backing), fixed_counts, config); for (unsigned char i = 2; i <= counts.size(); ++i) { inputs[i-2].Rewind(); } if (Quant::kTrain) { util::ErsatzProgress progress(std::accumulate(counts.begin() + 1, counts.end(), 0), config.ProgressMessages(), "Quantizing"); for (unsigned char i = 2; i < counts.size(); ++i) { TrainQuantizer(i, counts[i-1], sri.Values(i), inputs[i-2], progress, quant); } TrainProbQuantizer(counts.size(), counts.back(), inputs[counts.size() - 2], progress, quant); quant.FinishedLoading(config); } UnigramValue *unigrams = out.unigram_.Raw(); PopulateUnigramWeights(unigram_file.get(), counts[0], contexts[0], unigrams); unigram_file.reset(); for (unsigned char i = 2; i <= counts.size(); ++i) { inputs[i-2].Rewind(); } // Fill entries except unigram probabilities. { WriteEntries writer(contexts, quant, unigrams, out.middle_begin_, out.longest_, counts.size(), sri); RecursiveInsert(counts.size(), counts[0], inputs, config.ProgressMessages(), "Writing trie", writer); } // Do not disable this error message or else too little state will be returned. Both WriteEntries::Middle and returning state based on found n-grams will need to be fixed to handle this situation. for (unsigned char order = 2; order <= counts.size(); ++order) { const RecordReader &context = contexts[order - 2]; if (context) { FormatLoadException e; e << "A " << static_cast(order) << "-gram has context"; const WordIndex *ctx = reinterpret_cast(context.Data()); for (const WordIndex *i = ctx; i != ctx + order - 1; ++i) { e << ' ' << *i; } e << " so this context must appear in the model as a " << static_cast(order - 1) << "-gram but it does not"; throw e; } } /* Set ending offsets so the last entry will be sized properly */ // Last entry for unigrams was already set. 
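// (Illustrative note, not part of the original source.) Each middle entry stores only
// the *start* of its child range in the next order; an entry's range ends where the
// following entry's children begin. The loop below writes the one missing end value per
// order: middle order k is closed with the number of records inserted at order k+1, and
// the highest middle order is closed with longest_.InsertIndex().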
if (out.middle_begin_ != out.middle_end_) { for (typename TrieSearch::Middle *i = out.middle_begin_; i != out.middle_end_ - 1; ++i) { i->FinishedLoading((i+1)->InsertIndex(), config); } (out.middle_end_ - 1)->FinishedLoading(out.longest_.InsertIndex(), config); } } template uint8_t *TrieSearch::SetupMemory(uint8_t *start, const std::vector &counts, const Config &config) { quant_.SetupMemory(start, counts.size(), config); start += Quant::Size(counts.size(), config); unigram_.Init(start); start += Unigram::Size(counts[0]); FreeMiddles(); middle_begin_ = static_cast(malloc(sizeof(Middle) * (counts.size() - 2))); middle_end_ = middle_begin_ + (counts.size() - 2); std::vector middle_starts(counts.size() - 2); for (unsigned char i = 2; i < counts.size(); ++i) { middle_starts[i-2] = start; start += Middle::Size(Quant::MiddleBits(config), counts[i-1], counts[0], counts[i], config); } // Crazy backwards thing so we initialize using pointers to ones that have already been initialized for (unsigned char i = counts.size() - 1; i >= 2; --i) { new (middle_begin_ + i - 2) Middle( middle_starts[i-2], quant_.MiddleBits(config), counts[i-1], counts[0], counts[i], (i == counts.size() - 1) ? static_cast(longest_) : static_cast(middle_begin_[i-1]), config); } longest_.Init(start, quant_.LongestBits(config), counts[0]); return start + Longest::Size(Quant::LongestBits(config), counts.back(), counts[0]); } template void TrieSearch::LoadedBinary() { unigram_.LoadedBinary(); for (Middle *i = middle_begin_; i != middle_end_; ++i) { i->LoadedBinary(); } longest_.LoadedBinary(); } template void TrieSearch::InitializeFromARPA(const char *file, util::FilePiece &f, std::vector &counts, const Config &config, SortedVocabulary &vocab, Backing &backing) { std::string temporary_prefix; if (config.temporary_directory_prefix) { temporary_prefix = config.temporary_directory_prefix; } else if (config.write_mmap) { temporary_prefix = config.write_mmap; } else { temporary_prefix = file; } // At least 1MB sorting memory. 
SortedFiles sorted(config, f, counts, std::max(config.building_memory, 1048576), temporary_prefix, vocab); BuildTrie(sorted, counts, config, *this, quant_, vocab, backing); } template class TrieSearch; template class TrieSearch; template class TrieSearch; template class TrieSearch; } // namespace trie } // namespace ngram } // namespace lm ================================================ FILE: src/kenlm/lm/search_trie.hh ================================================ #ifndef LM_SEARCH_TRIE__ #define LM_SEARCH_TRIE__ #include "lm/config.hh" #include "lm/model_type.hh" #include "lm/return.hh" #include "lm/trie.hh" #include "lm/weights.hh" #include "util/file.hh" #include "util/file_piece.hh" #include #include namespace lm { namespace ngram { struct Backing; class SortedVocabulary; namespace trie { template class TrieSearch; class SortedFiles; template void BuildTrie(SortedFiles &files, std::vector &counts, const Config &config, TrieSearch &out, Quant &quant, const SortedVocabulary &vocab, Backing &backing); template class TrieSearch { public: typedef NodeRange Node; typedef ::lm::ngram::trie::UnigramPointer UnigramPointer; typedef typename Quant::MiddlePointer MiddlePointer; typedef typename Quant::LongestPointer LongestPointer; static const bool kDifferentRest = false; static const ModelType kModelType = static_cast(TRIE_SORTED + Quant::kModelTypeAdd + Bhiksha::kModelTypeAdd); static const unsigned int kVersion = 1; static void UpdateConfigFromBinary(int fd, const std::vector &counts, Config &config) { Quant::UpdateConfigFromBinary(fd, counts, config); util::AdvanceOrThrow(fd, Quant::Size(counts.size(), config) + Unigram::Size(counts[0])); Bhiksha::UpdateConfigFromBinary(fd, config); } static uint64_t Size(const std::vector &counts, const Config &config) { uint64_t ret = Quant::Size(counts.size(), config) + Unigram::Size(counts[0]); for (unsigned char i = 1; i < counts.size() - 1; ++i) { ret += Middle::Size(Quant::MiddleBits(config), counts[i], counts[0], counts[i+1], config); } return ret + Longest::Size(Quant::LongestBits(config), counts.back(), counts[0]); } TrieSearch() : middle_begin_(NULL), middle_end_(NULL) {} ~TrieSearch() { FreeMiddles(); } uint8_t *SetupMemory(uint8_t *start, const std::vector &counts, const Config &config); void LoadedBinary(); void InitializeFromARPA(const char *file, util::FilePiece &f, std::vector &counts, const Config &config, SortedVocabulary &vocab, Backing &backing); unsigned char Order() const { return middle_end_ - middle_begin_ + 2; } ProbBackoff &UnknownUnigram() { return unigram_.Unknown(); } UnigramPointer LookupUnigram(WordIndex word, Node &next, bool &independent_left, uint64_t &extend_left) const { extend_left = static_cast(word); UnigramPointer ret(unigram_.Find(word, next)); independent_left = (next.begin == next.end); return ret; } MiddlePointer Unpack(uint64_t extend_pointer, unsigned char extend_length, Node &node) const { return MiddlePointer(quant_, extend_length - 2, middle_begin_[extend_length - 2].ReadEntry(extend_pointer, node)); } MiddlePointer LookupMiddle(unsigned char order_minus_2, WordIndex word, Node &node, bool &independent_left, uint64_t &extend_left) const { util::BitAddress address(middle_begin_[order_minus_2].Find(word, node, extend_left)); independent_left = (address.base == NULL) || (node.begin == node.end); return MiddlePointer(quant_, order_minus_2, address); } LongestPointer LookupLongest(WordIndex word, const Node &node) const { return LongestPointer(quant_, longest_.Find(word, node)); } bool FastMakeNode(const 
WordIndex *begin, const WordIndex *end, Node &node) const { assert(begin != end); bool independent_left; uint64_t ignored; LookupUnigram(*begin, node, independent_left, ignored); for (const WordIndex *i = begin + 1; i < end; ++i) { if (independent_left || !LookupMiddle(i - begin - 1, *i, node, independent_left, ignored).Found()) return false; } return true; } private: friend void BuildTrie(SortedFiles &files, std::vector &counts, const Config &config, TrieSearch &out, Quant &quant, const SortedVocabulary &vocab, Backing &backing); // Middles are managed manually so we can delay construction and they don't have to be copyable. void FreeMiddles() { for (const Middle *i = middle_begin_; i != middle_end_; ++i) { i->~Middle(); } free(middle_begin_); } typedef trie::BitPackedMiddle Middle; typedef trie::BitPackedLongest Longest; Longest longest_; Middle *middle_begin_, *middle_end_; Quant quant_; typedef ::lm::ngram::trie::Unigram Unigram; Unigram unigram_; }; } // namespace trie } // namespace ngram } // namespace lm #endif // LM_SEARCH_TRIE__ ================================================ FILE: src/kenlm/lm/sizes.cc ================================================ #include "lm/sizes.hh" #include "lm/model.hh" #include "util/file_piece.hh" #include #include namespace lm { namespace ngram { void ShowSizes(const std::vector &counts, const lm::ngram::Config &config) { uint64_t sizes[6]; sizes[0] = ProbingModel::Size(counts, config); sizes[1] = RestProbingModel::Size(counts, config); sizes[2] = TrieModel::Size(counts, config); sizes[3] = QuantTrieModel::Size(counts, config); sizes[4] = ArrayTrieModel::Size(counts, config); sizes[5] = QuantArrayTrieModel::Size(counts, config); uint64_t max_length = *std::max_element(sizes, sizes + sizeof(sizes) / sizeof(uint64_t)); uint64_t min_length = *std::min_element(sizes, sizes + sizeof(sizes) / sizeof(uint64_t)); uint64_t divide; char prefix; if (min_length < (1 << 10) * 10) { prefix = ' '; divide = 1; } else if (min_length < (1 << 20) * 10) { prefix = 'k'; divide = 1 << 10; } else if (min_length < (1ULL << 30) * 10) { prefix = 'M'; divide = 1 << 20; } else { prefix = 'G'; divide = 1 << 30; } long int length = std::max(2, static_cast(ceil(log10((double) max_length / divide)))); std::cerr << "Memory estimate for binary LM:\ntype "; // right align bytes. 
for (long int i = 0; i < length - 2; ++i) std::cerr << ' '; std::cerr << prefix << "B\n" "probing " << std::setw(length) << (sizes[0] / divide) << " assuming -p " << config.probing_multiplier << "\n" "probing " << std::setw(length) << (sizes[1] / divide) << " assuming -r models -p " << config.probing_multiplier << "\n" "trie " << std::setw(length) << (sizes[2] / divide) << " without quantization\n" "trie " << std::setw(length) << (sizes[3] / divide) << " assuming -q " << (unsigned)config.prob_bits << " -b " << (unsigned)config.backoff_bits << " quantization \n" "trie " << std::setw(length) << (sizes[4] / divide) << " assuming -a " << (unsigned)config.pointer_bhiksha_bits << " array pointer compression\n" "trie " << std::setw(length) << (sizes[5] / divide) << " assuming -a " << (unsigned)config.pointer_bhiksha_bits << " -q " << (unsigned)config.prob_bits << " -b " << (unsigned)config.backoff_bits<< " array pointer compression and quantization\n"; } void ShowSizes(const std::vector &counts) { lm::ngram::Config config; ShowSizes(counts, config); } void ShowSizes(const char *file, const lm::ngram::Config &config) { std::vector counts; util::FilePiece f(file); lm::ReadARPACounts(f, counts); ShowSizes(counts, config); } }} //namespaces ================================================ FILE: src/kenlm/lm/sizes.hh ================================================ #ifndef LM_SIZES__ #define LM_SIZES__ #include #include namespace lm { namespace ngram { struct Config; void ShowSizes(const std::vector &counts, const lm::ngram::Config &config); void ShowSizes(const std::vector &counts); void ShowSizes(const char *file, const lm::ngram::Config &config); }} // namespaces #endif // LM_SIZES__ ================================================ FILE: src/kenlm/lm/state.hh ================================================ #ifndef LM_STATE__ #define LM_STATE__ #include "lm/max_order.hh" #include "lm/word_index.hh" #include "util/murmur_hash.hh" #include namespace lm { namespace ngram { // This is a POD but if you want memcmp to return the same as operator==, call // ZeroRemaining first. class State { public: bool operator==(const State &other) const { if (length != other.length) return false; return !memcmp(words, other.words, length * sizeof(WordIndex)); } // Three way comparison function. int Compare(const State &other) const { if (length != other.length) return length < other.length ? -1 : 1; return memcmp(words, other.words, length * sizeof(WordIndex)); } bool operator<(const State &other) const { if (length != other.length) return length < other.length; return memcmp(words, other.words, length * sizeof(WordIndex)) < 0; } // Call this before using raw memcmp. void ZeroRemaining() { for (unsigned char i = length; i < KENLM_MAX_ORDER - 1; ++i) { words[i] = 0; backoff[i] = 0.0; } } unsigned char Length() const { return length; } // You shouldn't need to touch anything below this line, but the members are public so FullState will qualify as a POD. // This order minimizes total size of the struct if WordIndex is 64 bit, float is 32 bit, and alignment of 64 bit integers is 64 bit. 
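  // (Illustrative usage of State, not part of the original source; "model" stands for
  // any loaded concrete Model.) Unused trailing slots may hold garbage, so zero them
  // before hashing or memcmp-ing the arrays directly:
  //
  //   lm::ngram::State a = model.BeginSentenceState(), b = a;
  //   a.ZeroRemaining(); b.ZeroRemaining();
  //   bool same = a.length == b.length
  //            && !memcmp(a.words, b.words, sizeof(a.words))
  //            && !memcmp(a.backoff, b.backoff, sizeof(a.backoff));  // agrees with (a == b)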
WordIndex words[KENLM_MAX_ORDER - 1]; float backoff[KENLM_MAX_ORDER - 1]; unsigned char length; }; typedef State Right; inline uint64_t hash_value(const State &state, uint64_t seed = 0) { return util::MurmurHashNative(state.words, sizeof(WordIndex) * state.length, seed); } struct Left { bool operator==(const Left &other) const { return length == other.length && (!length || (pointers[length - 1] == other.pointers[length - 1] && full == other.full)); } int Compare(const Left &other) const { if (length < other.length) return -1; if (length > other.length) return 1; if (length == 0) return 0; // Must be full. if (pointers[length - 1] > other.pointers[length - 1]) return 1; if (pointers[length - 1] < other.pointers[length - 1]) return -1; return (int)full - (int)other.full; } bool operator<(const Left &other) const { return Compare(other) == -1; } void ZeroRemaining() { for (uint64_t * i = pointers + length; i < pointers + KENLM_MAX_ORDER - 1; ++i) *i = 0; } uint64_t pointers[KENLM_MAX_ORDER - 1]; unsigned char length; bool full; }; inline uint64_t hash_value(const Left &left) { unsigned char add[2]; add[0] = left.length; add[1] = left.full; return util::MurmurHashNative(add, 2, left.length ? left.pointers[left.length - 1] : 0); } struct ChartState { bool operator==(const ChartState &other) { return (right == other.right) && (left == other.left); } int Compare(const ChartState &other) const { int lres = left.Compare(other.left); if (lres) return lres; return right.Compare(other.right); } bool operator<(const ChartState &other) const { return Compare(other) == -1; } void ZeroRemaining() { left.ZeroRemaining(); right.ZeroRemaining(); } Left left; State right; }; inline uint64_t hash_value(const ChartState &state) { return hash_value(state.right, hash_value(state.left)); } } // namespace ngram } // namespace lm #endif // LM_STATE__ ================================================ FILE: src/kenlm/lm/test.arpa ================================================ \data\ ngram 1=37 ngram 2=47 ngram 3=11 ngram 4=6 ngram 5=4 \1-grams: -1.383514 , -0.30103 -1.139057 . -0.845098 -1.029493 -99 -0.4149733 -1.995635 -20 -1.285941 a -0.69897 -1.687872 also -0.30103 -1.687872 beyond -0.30103 -1.687872 biarritz -0.30103 -1.687872 call -0.30103 -1.687872 concerns -0.30103 -1.687872 consider -0.30103 -1.687872 considering -0.30103 -1.687872 for -0.30103 -1.509559 higher -0.30103 -1.687872 however -0.30103 -1.687872 i -0.30103 -1.687872 immediate -0.30103 -1.687872 in -0.30103 -1.687872 is -0.30103 -1.285941 little -0.69897 -1.383514 loin -0.30103 -1.687872 look -0.30103 -1.285941 looking -0.4771212 -1.206319 more -0.544068 -1.509559 on -0.4771212 -1.509559 screening -0.4771212 -1.687872 small -0.30103 -1.687872 the -0.30103 -1.687872 to -0.30103 -1.687872 watch -0.30103 -1.687872 watching -0.30103 -1.687872 what -0.30103 -1.687872 would -0.30103 -3.141592 foo -2.718281 bar 3.0 -6.535897 baz -0.0 \2-grams: -0.6925742 , . -0.7522095 , however -0.7522095 , is -0.0602359 . -0.4846522 looking -0.4771214 -1.051485 screening -1.07153 the -1.07153 watching -1.07153 what -0.09132547 a little -0.69897 -0.2922095 also call -0.2922095 beyond immediate -0.2705918 biarritz . -0.2922095 call for -0.2922095 concerns in -0.2922095 consider watch -0.2922095 considering consider -0.2834328 for , -0.5511513 higher more -0.5845945 higher small -0.2834328 however , -0.2922095 i would -0.2922095 immediate concerns -0.2922095 in biarritz -0.2922095 is to -0.09021038 little more -0.1998621 -0.7273645 loin , -0.6925742 loin . 
-0.6708385 loin -0.2922095 look beyond -0.4638903 looking higher -0.4638903 looking on -0.4771212 -0.5136299 more . -0.4771212 -0.3561665 more loin -0.1649931 on a -0.4771213 -0.1649931 screening a -0.4771213 -0.2705918 small . -0.287799 the screening -0.2922095 to look -0.2622373 watch -0.2922095 watching considering -0.2922095 what i -0.2922095 would also -2 also would -6 -15 -2 -4 however -1 -6 foo bar \3-grams: -0.01916512 more . -0.0283603 on a little -0.4771212 -0.0283603 screening a little -0.4771212 -0.01660496 a little more -0.09409451 -0.3488368 looking higher -0.3488368 looking on -0.4771212 -0.1892331 little more loin -0.04835128 looking on a -0.4771212 -3 also would consider -7 -6 however -12 -7 to look good \4-grams: -0.009249173 looking on a little -0.4771212 -0.005464747 on a little more -0.4771212 -0.005464747 screening a little more -0.1453306 a little more loin -0.01552657 looking on a -0.4771212 -4 also would consider higher -8 \5-grams: -0.003061223 looking on a little -0.001813953 looking on a little more -0.0432557 on a little more loin -5 also would consider higher looking \end\ ================================================ FILE: src/kenlm/lm/test_nounk.arpa ================================================ \data\ ngram 1=36 ngram 2=45 ngram 3=10 ngram 4=6 ngram 5=4 \1-grams: -1.383514 , -0.30103 -1.139057 . -0.845098 -1.029493 -99 -0.4149733 -1.285941 a -0.69897 -1.687872 also -0.30103 -1.687872 beyond -0.30103 -1.687872 biarritz -0.30103 -1.687872 call -0.30103 -1.687872 concerns -0.30103 -1.687872 consider -0.30103 -1.687872 considering -0.30103 -1.687872 for -0.30103 -1.509559 higher -0.30103 -1.687872 however -0.30103 -1.687872 i -0.30103 -1.687872 immediate -0.30103 -1.687872 in -0.30103 -1.687872 is -0.30103 -1.285941 little -0.69897 -1.383514 loin -0.30103 -1.687872 look -0.30103 -1.285941 looking -0.4771212 -1.206319 more -0.544068 -1.509559 on -0.4771212 -1.509559 screening -0.4771212 -1.687872 small -0.30103 -1.687872 the -0.30103 -1.687872 to -0.30103 -1.687872 watch -0.30103 -1.687872 watching -0.30103 -1.687872 what -0.30103 -1.687872 would -0.30103 -3.141592 foo -2.718281 bar 3.0 -6.535897 baz -0.0 \2-grams: -0.6925742 , . -0.7522095 , however -0.7522095 , is -0.0602359 . -0.4846522 looking -0.4771214 -1.051485 screening -1.07153 the -1.07153 watching -1.07153 what -0.09132547 a little -0.69897 -0.2922095 also call -0.2922095 beyond immediate -0.2705918 biarritz . -0.2922095 call for -0.2922095 concerns in -0.2922095 consider watch -0.2922095 considering consider -0.2834328 for , -0.5511513 higher more -0.5845945 higher small -0.2834328 however , -0.2922095 i would -0.2922095 immediate concerns -0.2922095 in biarritz -0.2922095 is to -0.09021038 little more -0.1998621 -0.7273645 loin , -0.6925742 loin . -0.6708385 loin -0.2922095 look beyond -0.4638903 looking higher -0.4638903 looking on -0.4771212 -0.5136299 more . -0.4771212 -0.3561665 more loin -0.1649931 on a -0.4771213 -0.1649931 screening a -0.4771213 -0.2705918 small . -0.287799 the screening -0.2922095 to look -0.2622373 watch -0.2922095 watching considering -0.2922095 what i -0.2922095 would also -2 also would -6 -6 foo bar \3-grams: -0.01916512 more . 
-0.0283603 on a little -0.4771212 -0.0283603 screening a little -0.4771212 -0.01660496 a little more -0.09409451 -0.3488368 looking higher -0.3488368 looking on -0.4771212 -0.1892331 little more loin -0.04835128 looking on a -0.4771212 -3 also would consider -7 -7 to look good \4-grams: -0.009249173 looking on a little -0.4771212 -0.005464747 on a little more -0.4771212 -0.005464747 screening a little more -0.1453306 a little more loin -0.01552657 looking on a -0.4771212 -4 also would consider higher -8 \5-grams: -0.003061223 looking on a little -0.001813953 looking on a little more -0.0432557 on a little more loin -5 also would consider higher looking \end\ ================================================ FILE: src/kenlm/lm/trie.cc ================================================ #include "lm/trie.hh" #include "lm/bhiksha.hh" #include "util/bit_packing.hh" #include "util/exception.hh" #include "util/sorted_uniform.hh" #include namespace lm { namespace ngram { namespace trie { namespace { class KeyAccessor { public: KeyAccessor(const void *base, uint64_t key_mask, uint8_t key_bits, uint8_t total_bits) : base_(reinterpret_cast(base)), key_mask_(key_mask), key_bits_(key_bits), total_bits_(total_bits) {} typedef uint64_t Key; Key operator()(uint64_t index) const { return util::ReadInt57(base_, index * static_cast(total_bits_), key_bits_, key_mask_); } private: const uint8_t *const base_; const WordIndex key_mask_; const uint8_t key_bits_, total_bits_; }; bool FindBitPacked(const void *base, uint64_t key_mask, uint8_t key_bits, uint8_t total_bits, uint64_t begin_index, uint64_t end_index, const uint64_t max_vocab, const uint64_t key, uint64_t &at_index) { KeyAccessor accessor(base, key_mask, key_bits, total_bits); if (!util::BoundedSortedUniformFind::T>(accessor, begin_index - 1, (uint64_t)0, end_index, max_vocab, key, at_index)) return false; return true; } } // namespace uint64_t BitPacked::BaseSize(uint64_t entries, uint64_t max_vocab, uint8_t remaining_bits) { uint8_t total_bits = util::RequiredBits(max_vocab) + remaining_bits; // Extra entry for next pointer at the end. // +7 then / 8 to round up bits and convert to bytes // +sizeof(uint64_t) so that ReadInt57 etc don't go segfault. // Note that this waste is O(order), not O(number of ngrams). return ((1 + entries) * total_bits + 7) / 8 + sizeof(uint64_t); } void BitPacked::BaseInit(void *base, uint64_t max_vocab, uint8_t remaining_bits) { util::BitPackingSanity(); word_bits_ = util::RequiredBits(max_vocab); word_mask_ = (1ULL << word_bits_) - 1ULL; if (word_bits_ > 57) UTIL_THROW(util::Exception, "Sorry, word indices more than " << (1ULL << 57) << " are not implemented. Edit util/bit_packing.hh and fix the bit packing functions."); total_bits_ = word_bits_ + remaining_bits; base_ = static_cast(base); insert_index_ = 0; max_vocab_ = max_vocab; } template uint64_t BitPackedMiddle::Size(uint8_t quant_bits, uint64_t entries, uint64_t max_vocab, uint64_t max_ptr, const Config &config) { return Bhiksha::Size(entries + 1, max_ptr, config) + BaseSize(entries, max_vocab, quant_bits + Bhiksha::InlineBits(entries + 1, max_ptr, config)); } template BitPackedMiddle::BitPackedMiddle(void *base, uint8_t quant_bits, uint64_t entries, uint64_t max_vocab, uint64_t max_next, const BitPacked &next_source, const Config &config) : BitPacked(), quant_bits_(quant_bits), // If the offset of the method changes, also change TrieSearch::UpdateConfigFromBinary. 
bhiksha_(base, entries + 1, max_next, config), next_source_(&next_source) { if (entries + 1 >= (1ULL << 57) || (max_next >= (1ULL << 57))) UTIL_THROW(util::Exception, "Sorry, this does not support more than " << (1ULL << 57) << " n-grams of a particular order. Edit util/bit_packing.hh and fix the bit packing functions."); BaseInit(reinterpret_cast(base) + Bhiksha::Size(entries + 1, max_next, config), max_vocab, quant_bits_ + bhiksha_.InlineBits()); } template util::BitAddress BitPackedMiddle::Insert(WordIndex word) { assert(word <= word_mask_); uint64_t at_pointer = insert_index_ * total_bits_; util::WriteInt57(base_, at_pointer, word_bits_, word); at_pointer += word_bits_; util::BitAddress ret(base_, at_pointer); at_pointer += quant_bits_; uint64_t next = next_source_->InsertIndex(); bhiksha_.WriteNext(base_, at_pointer, insert_index_, next); ++insert_index_; return ret; } template util::BitAddress BitPackedMiddle::Find(WordIndex word, NodeRange &range, uint64_t &pointer) const { uint64_t at_pointer; if (!FindBitPacked(base_, word_mask_, word_bits_, total_bits_, range.begin, range.end, max_vocab_, word, at_pointer)) { return util::BitAddress(NULL, 0); } pointer = at_pointer; at_pointer *= total_bits_; at_pointer += word_bits_; bhiksha_.ReadNext(base_, at_pointer + quant_bits_, pointer, total_bits_, range); return util::BitAddress(base_, at_pointer); } template void BitPackedMiddle::FinishedLoading(uint64_t next_end, const Config &config) { uint64_t last_next_write = (insert_index_ + 1) * total_bits_ - bhiksha_.InlineBits(); bhiksha_.WriteNext(base_, last_next_write, insert_index_ + 1, next_end); bhiksha_.FinishedLoading(config); } util::BitAddress BitPackedLongest::Insert(WordIndex index) { assert(index <= word_mask_); uint64_t at_pointer = insert_index_ * total_bits_; util::WriteInt57(base_, at_pointer, word_bits_, index); at_pointer += word_bits_; ++insert_index_; return util::BitAddress(base_, at_pointer); } util::BitAddress BitPackedLongest::Find(WordIndex word, const NodeRange &range) const { uint64_t at_pointer; if (!FindBitPacked(base_, word_mask_, word_bits_, total_bits_, range.begin, range.end, max_vocab_, word, at_pointer)) return util::BitAddress(NULL, 0); at_pointer = at_pointer * total_bits_ + word_bits_; return util::BitAddress(base_, at_pointer); } template class BitPackedMiddle; template class BitPackedMiddle; } // namespace trie } // namespace ngram } // namespace lm ================================================ FILE: src/kenlm/lm/trie.hh ================================================ #ifndef LM_TRIE__ #define LM_TRIE__ #include "lm/weights.hh" #include "lm/word_index.hh" #include "util/bit_packing.hh" #include #include namespace lm { namespace ngram { struct Config; namespace trie { struct NodeRange { uint64_t begin, end; }; // TODO: if the number of unigrams is a concern, also bit pack these records. struct UnigramValue { ProbBackoff weights; uint64_t next; uint64_t Next() const { return next; } }; class UnigramPointer { public: explicit UnigramPointer(const ProbBackoff &to) : to_(&to) {} UnigramPointer() : to_(NULL) {} bool Found() const { return to_ != NULL; } float Prob() const { return to_->prob; } float Backoff() const { return to_->backoff; } float Rest() const { return Prob(); } private: const ProbBackoff *to_; }; class Unigram { public: Unigram() {} void Init(void *start) { unigram_ = static_cast(start); } static uint64_t Size(uint64_t count) { // +1 in case unknown doesn't appear. +1 for the final next. 
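    // (Illustrative arithmetic, not part of the original source; exact sizes depend on
    // the platform's struct layout.) With an 8-byte ProbBackoff and an 8-byte next
    // pointer, UnigramValue is typically 16 bytes, so a 37-word vocabulary reserves
    // (37 + 2) * 16 = 624 bytes: one spare slot in case <unk> never appears, plus one
    // trailing entry whose next field closes the last word's child range.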
return (count + 2) * sizeof(UnigramValue); } const ProbBackoff &Lookup(WordIndex index) const { return unigram_[index].weights; } ProbBackoff &Unknown() { return unigram_[0].weights; } UnigramValue *Raw() { return unigram_; } void LoadedBinary() {} UnigramPointer Find(WordIndex word, NodeRange &next) const { UnigramValue *val = unigram_ + word; next.begin = val->next; next.end = (val+1)->next; return UnigramPointer(val->weights); } private: UnigramValue *unigram_; }; class BitPacked { public: BitPacked() {} uint64_t InsertIndex() const { return insert_index_; } protected: static uint64_t BaseSize(uint64_t entries, uint64_t max_vocab, uint8_t remaining_bits); void BaseInit(void *base, uint64_t max_vocab, uint8_t remaining_bits); uint8_t word_bits_; uint8_t total_bits_; uint64_t word_mask_; uint8_t *base_; uint64_t insert_index_, max_vocab_; }; template class BitPackedMiddle : public BitPacked { public: static uint64_t Size(uint8_t quant_bits, uint64_t entries, uint64_t max_vocab, uint64_t max_next, const Config &config); // next_source need not be initialized. BitPackedMiddle(void *base, uint8_t quant_bits, uint64_t entries, uint64_t max_vocab, uint64_t max_next, const BitPacked &next_source, const Config &config); util::BitAddress Insert(WordIndex word); void FinishedLoading(uint64_t next_end, const Config &config); void LoadedBinary() { bhiksha_.LoadedBinary(); } util::BitAddress Find(WordIndex word, NodeRange &range, uint64_t &pointer) const; util::BitAddress ReadEntry(uint64_t pointer, NodeRange &range) { uint64_t addr = pointer * total_bits_; addr += word_bits_; bhiksha_.ReadNext(base_, addr + quant_bits_, pointer, total_bits_, range); return util::BitAddress(base_, addr); } private: uint8_t quant_bits_; Bhiksha bhiksha_; const BitPacked *next_source_; }; class BitPackedLongest : public BitPacked { public: static uint64_t Size(uint8_t quant_bits, uint64_t entries, uint64_t max_vocab) { return BaseSize(entries, max_vocab, quant_bits); } BitPackedLongest() {} void Init(void *base, uint8_t quant_bits, uint64_t max_vocab) { BaseInit(base, max_vocab, quant_bits); } void LoadedBinary() {} util::BitAddress Insert(WordIndex word); util::BitAddress Find(WordIndex word, const NodeRange &node) const; private: uint8_t quant_bits_; }; } // namespace trie } // namespace ngram } // namespace lm #endif // LM_TRIE__ ================================================ FILE: src/kenlm/lm/trie_sort.cc ================================================ #include "lm/trie_sort.hh" #include "lm/config.hh" #include "lm/lm_exception.hh" #include "lm/read_arpa.hh" #include "lm/vocab.hh" #include "lm/weights.hh" #include "lm/word_index.hh" #include "util/file_piece.hh" #include "util/mmap.hh" #include "util/proxy_iterator.hh" #include "util/sized_iterator.hh" #include #include #include #include #include #include #include namespace lm { namespace ngram { namespace trie { namespace { typedef util::SizedIterator NGramIter; // Proxy for an entry except there is some extra cruft between the entries. This is used to sort (n-1)-grams using the same memory as the sorted n-grams. 
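// (Illustrative note, not part of the original source.) Each sorted record is laid out as
//   [ word_0 | word_1 ... word_{order-1} | weights ]
// WriteContextFile below re-sorts the same buffer by each record's trailing (order - 1)
// stored words: a proxy starts one WordIndex into the record and only "pays attention" to
// (order - 1) * sizeof(WordIndex) bytes, treating the skipped word and the weights as
// inert padding between keys. Roughly:
//
//   PartialViewProxy view(begin + sizeof(WordIndex),         // skip the first stored word
//                         entry_size,                        // stride between records
//                         (order - 1) * sizeof(WordIndex));  // bytes compared and copied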
class PartialViewProxy { public: PartialViewProxy() : attention_size_(0), inner_() {} PartialViewProxy(void *ptr, std::size_t block_size, std::size_t attention_size) : attention_size_(attention_size), inner_(ptr, block_size) {} operator std::string() const { return std::string(reinterpret_cast(inner_.Data()), attention_size_); } PartialViewProxy &operator=(const PartialViewProxy &from) { memcpy(inner_.Data(), from.inner_.Data(), attention_size_); return *this; } PartialViewProxy &operator=(const std::string &from) { memcpy(inner_.Data(), from.data(), attention_size_); return *this; } const void *Data() const { return inner_.Data(); } void *Data() { return inner_.Data(); } private: friend class util::ProxyIterator; typedef std::string value_type; const std::size_t attention_size_; typedef util::SizedInnerIterator InnerIterator; InnerIterator &Inner() { return inner_; } const InnerIterator &Inner() const { return inner_; } InnerIterator inner_; }; typedef util::ProxyIterator PartialIter; FILE *DiskFlush(const void *mem_begin, const void *mem_end, const std::string &temp_prefix) { util::scoped_fd file(util::MakeTemp(temp_prefix)); util::WriteOrThrow(file.get(), mem_begin, (uint8_t*)mem_end - (uint8_t*)mem_begin); return util::FDOpenOrThrow(file); } FILE *WriteContextFile(uint8_t *begin, uint8_t *end, const std::string &temp_prefix, std::size_t entry_size, unsigned char order) { const size_t context_size = sizeof(WordIndex) * (order - 1); // Sort just the contexts using the same memory. PartialIter context_begin(PartialViewProxy(begin + sizeof(WordIndex), entry_size, context_size)); PartialIter context_end(PartialViewProxy(end + sizeof(WordIndex), entry_size, context_size)); #if defined(_WIN32) || defined(_WIN64) std::stable_sort #else std::sort #endif (context_begin, context_end, util::SizedCompare(EntryCompare(order - 1))); util::scoped_FILE out(util::FMakeTemp(temp_prefix)); // Write out to file and uniqueify at the same time. Could have used unique_copy if there was an appropriate OutputIterator. if (context_begin == context_end) return out.release(); PartialIter i(context_begin); util::WriteOrThrow(out.get(), i->Data(), context_size); const void *previous = i->Data(); ++i; for (; i != context_end; ++i) { if (memcmp(previous, i->Data(), context_size)) { util::WriteOrThrow(out.get(), i->Data(), context_size); previous = i->Data(); } } return out.release(); } struct ThrowCombine { void operator()(std::size_t /*entry_size*/, const void * /*first*/, const void * /*second*/, FILE * /*out*/) const { UTIL_THROW(FormatLoadException, "Duplicate n-gram detected."); } }; // Useful for context files that just contain records with no value. 
struct FirstCombine { void operator()(std::size_t entry_size, const void *first, const void * /*second*/, FILE *out) const { util::WriteOrThrow(out, first, entry_size); } }; template FILE *MergeSortedFiles(FILE *first_file, FILE *second_file, const std::string &temp_prefix, std::size_t weights_size, unsigned char order, const Combine &combine) { std::size_t entry_size = sizeof(WordIndex) * order + weights_size; RecordReader first, second; first.Init(first_file, entry_size); second.Init(second_file, entry_size); util::scoped_FILE out_file(util::FMakeTemp(temp_prefix)); EntryCompare less(order); while (first && second) { if (less(first.Data(), second.Data())) { util::WriteOrThrow(out_file.get(), first.Data(), entry_size); ++first; } else if (less(second.Data(), first.Data())) { util::WriteOrThrow(out_file.get(), second.Data(), entry_size); ++second; } else { combine(entry_size, first.Data(), second.Data(), out_file.get()); ++first; ++second; } } for (RecordReader &remains = (first ? first : second); remains; ++remains) { util::WriteOrThrow(out_file.get(), remains.Data(), entry_size); } return out_file.release(); } } // namespace void RecordReader::Init(FILE *file, std::size_t entry_size) { entry_size_ = entry_size; data_.reset(malloc(entry_size)); UTIL_THROW_IF(!data_.get(), util::ErrnoException, "Failed to malloc read buffer"); file_ = file; if (file) { rewind(file); remains_ = true; ++*this; } else { remains_ = false; } } void RecordReader::Overwrite(const void *start, std::size_t amount) { long internal = (uint8_t*)start - (uint8_t*)data_.get(); UTIL_THROW_IF(fseek(file_, internal - entry_size_, SEEK_CUR), util::ErrnoException, "Couldn't seek backwards for revision"); util::WriteOrThrow(file_, start, amount); long forward = entry_size_ - internal - amount; #if !defined(_WIN32) && !defined(_WIN64) if (forward) #endif UTIL_THROW_IF(fseek(file_, forward, SEEK_CUR), util::ErrnoException, "Couldn't seek forwards past revision"); } void RecordReader::Rewind() { if (file_) { rewind(file_); remains_ = true; ++*this; } else { remains_ = false; } } SortedFiles::SortedFiles(const Config &config, util::FilePiece &f, std::vector &counts, size_t buffer, const std::string &file_prefix, SortedVocabulary &vocab) { PositiveProbWarn warn(config.positive_log_probability); unigram_.reset(util::MakeTemp(file_prefix)); { // In case appears. size_t size_out = (counts[0] + 1) * sizeof(ProbBackoff); util::scoped_mmap unigram_mmap(util::MapZeroedWrite(unigram_.get(), size_out), size_out); Read1Grams(f, counts[0], vocab, reinterpret_cast(unigram_mmap.get()), warn); CheckSpecials(config, vocab); if (!vocab.SawUnk()) ++counts[0]; } // Only use as much buffer as we need. 
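  // (Illustrative arithmetic, not part of the original source; assumes 4-byte WordIndex
  // and float.) The loop below sizes the read buffer for the most demanding order:
  //   middle orders:  (order * sizeof(WordIndex) + 2 * sizeof(float)) * counts[order - 1]
  //   highest order:  (order * sizeof(WordIndex) + sizeof(float)) * counts.back()
  // For example, one million trigrams in a longer model need (3*4 + 2*4) * 1000000 bytes,
  // about 20 MB; the user-supplied buffer is then capped at that maximum, never grown.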
size_t buffer_use = 0; for (unsigned int order = 2; order < counts.size(); ++order) { buffer_use = std::max(buffer_use, static_cast((sizeof(WordIndex) * order + 2 * sizeof(float)) * counts[order - 1])); } buffer_use = std::max(buffer_use, static_cast((sizeof(WordIndex) * counts.size() + sizeof(float)) * counts.back())); buffer = std::min(buffer, buffer_use); util::scoped_malloc mem; mem.reset(malloc(buffer)); if (!mem.get()) UTIL_THROW(util::ErrnoException, "malloc failed for sort buffer size " << buffer); for (unsigned char order = 2; order <= counts.size(); ++order) { ConvertToSorted(f, vocab, counts, file_prefix, order, warn, mem.get(), buffer); } ReadEnd(f); } namespace { class Closer { public: explicit Closer(std::deque &files) : files_(files) {} ~Closer() { for (std::deque::iterator i = files_.begin(); i != files_.end(); ++i) { util::scoped_FILE deleter(*i); } } void PopFront() { util::scoped_FILE deleter(files_.front()); files_.pop_front(); } private: std::deque &files_; }; } // namespace void SortedFiles::ConvertToSorted(util::FilePiece &f, const SortedVocabulary &vocab, const std::vector &counts, const std::string &file_prefix, unsigned char order, PositiveProbWarn &warn, void *mem, std::size_t mem_size) { ReadNGramHeader(f, order); const size_t count = counts[order - 1]; // Size of weights. Does it include backoff? const size_t words_size = sizeof(WordIndex) * order; const size_t weights_size = sizeof(float) + ((order == counts.size()) ? 0 : sizeof(float)); const size_t entry_size = words_size + weights_size; const size_t batch_size = std::min(count, mem_size / entry_size); uint8_t *const begin = reinterpret_cast(mem); std::deque files, contexts; Closer files_closer(files), contexts_closer(contexts); for (std::size_t batch = 0, done = 0; done < count; ++batch) { uint8_t *out = begin; uint8_t *out_end = out + std::min(count - done, batch_size) * entry_size; if (order == counts.size()) { for (; out != out_end; out += entry_size) { ReadNGram(f, order, vocab, reinterpret_cast(out), *reinterpret_cast(out + words_size), warn); } } else { for (; out != out_end; out += entry_size) { ReadNGram(f, order, vocab, reinterpret_cast(out), *reinterpret_cast(out + words_size), warn); } } // Sort full records by full n-gram. util::SizedProxy proxy_begin(begin, entry_size), proxy_end(out_end, entry_size); // parallel_sort uses too much RAM. TODO: figure out why windows sort doesn't like my proxies. #if defined(_WIN32) || defined(_WIN64) std::stable_sort #else std::sort #endif (NGramIter(proxy_begin), NGramIter(proxy_end), util::SizedCompare(EntryCompare(order))); files.push_back(DiskFlush(begin, out_end, file_prefix)); contexts.push_back(WriteContextFile(begin, out_end, file_prefix, entry_size, order)); done += (out_end - begin) / entry_size; } // All individual files created. Merge them. while (files.size() > 1) { files.push_back(MergeSortedFiles(files[0], files[1], file_prefix, weights_size, order, ThrowCombine())); files_closer.PopFront(); files_closer.PopFront(); contexts.push_back(MergeSortedFiles(contexts[0], contexts[1], file_prefix, 0, order - 1, FirstCombine())); contexts_closer.PopFront(); contexts_closer.PopFront(); } if (!files.empty()) { // Steal from closers. 
full_[order - 2].reset(files.front()); files.pop_front(); context_[order - 2].reset(contexts.front()); contexts.pop_front(); } } } // namespace trie } // namespace ngram } // namespace lm ================================================ FILE: src/kenlm/lm/trie_sort.hh ================================================ // Step of trie builder: create sorted files. #ifndef LM_TRIE_SORT__ #define LM_TRIE_SORT__ #include "lm/max_order.hh" #include "lm/word_index.hh" #include "util/file.hh" #include "util/scoped.hh" #include #include #include #include #include namespace util { class FilePiece; } // namespace util namespace lm { class PositiveProbWarn; namespace ngram { class SortedVocabulary; struct Config; namespace trie { class EntryCompare : public std::binary_function { public: explicit EntryCompare(unsigned char order) : order_(order) {} bool operator()(const void *first_void, const void *second_void) const { const WordIndex *first = static_cast(first_void); const WordIndex *second = static_cast(second_void); const WordIndex *end = first + order_; for (; first != end; ++first, ++second) { if (*first < *second) return true; if (*first > *second) return false; } return false; } private: unsigned char order_; }; class RecordReader { public: RecordReader() : remains_(true) {} void Init(FILE *file, std::size_t entry_size); void *Data() { return data_.get(); } const void *Data() const { return data_.get(); } RecordReader &operator++() { std::size_t ret = fread(data_.get(), entry_size_, 1, file_); if (!ret) { UTIL_THROW_IF(!feof(file_), util::ErrnoException, "Error reading temporary file"); remains_ = false; } return *this; } operator bool() const { return remains_; } void Rewind(); std::size_t EntrySize() const { return entry_size_; } void Overwrite(const void *start, std::size_t amount); private: FILE *file_; util::scoped_malloc data_; bool remains_; std::size_t entry_size_; }; class SortedFiles { public: // Build from ARPA SortedFiles(const Config &config, util::FilePiece &f, std::vector &counts, std::size_t buffer, const std::string &file_prefix, SortedVocabulary &vocab); int StealUnigram() { return unigram_.release(); } FILE *Full(unsigned char order) { return full_[order - 2].get(); } FILE *Context(unsigned char of_order) { return context_[of_order - 2].get(); } private: void ConvertToSorted(util::FilePiece &f, const SortedVocabulary &vocab, const std::vector &counts, const std::string &prefix, unsigned char order, PositiveProbWarn &warn, void *mem, std::size_t mem_size); util::scoped_fd unigram_; util::scoped_FILE full_[KENLM_MAX_ORDER - 1], context_[KENLM_MAX_ORDER - 1]; }; } // namespace trie } // namespace ngram } // namespace lm #endif // LM_TRIE_SORT__ ================================================ FILE: src/kenlm/lm/value.hh ================================================ #ifndef LM_VALUE__ #define LM_VALUE__ #include "lm/model_type.hh" #include "lm/value_build.hh" #include "lm/weights.hh" #include "util/bit_packing.hh" #include namespace lm { namespace ngram { // Template proxy for probing unigrams and middle. 
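// (Illustrative note, not part of the original source.) The probing tables reuse the sign
// bit of the stored log probability as a left-extension marker (log10 probabilities are
// not positive, so the bit is otherwise unused). Prob() below therefore forces the sign
// bit back on before returning, and IndependentLeft() just tests it. Roughly, with
// stored_prob standing for a value read from the table:
//
//   util::FloatEnc enc;
//   enc.f = stored_prob;
//   bool extends_left = !(enc.i & util::kSignBit);  // cleared sign bit: a longer n-gram extends this one
//   enc.i |= util::kSignBit;                        // restore the negative log probability
//   float prob = enc.f;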
template class GenericProbingProxy { public: explicit GenericProbingProxy(const Weights &to) : to_(&to) {} GenericProbingProxy() : to_(0) {} bool Found() const { return to_ != 0; } float Prob() const { util::FloatEnc enc; enc.f = to_->prob; enc.i |= util::kSignBit; return enc.f; } float Backoff() const { return to_->backoff; } bool IndependentLeft() const { util::FloatEnc enc; enc.f = to_->prob; return enc.i & util::kSignBit; } protected: const Weights *to_; }; // Basic proxy for trie unigrams. template class GenericTrieUnigramProxy { public: explicit GenericTrieUnigramProxy(const Weights &to) : to_(&to) {} GenericTrieUnigramProxy() : to_(0) {} bool Found() const { return to_ != 0; } float Prob() const { return to_->prob; } float Backoff() const { return to_->backoff; } float Rest() const { return Prob(); } protected: const Weights *to_; }; struct BackoffValue { typedef ProbBackoff Weights; static const ModelType kProbingModelType = PROBING; class ProbingProxy : public GenericProbingProxy { public: explicit ProbingProxy(const Weights &to) : GenericProbingProxy(to) {} ProbingProxy() {} float Rest() const { return Prob(); } }; class TrieUnigramProxy : public GenericTrieUnigramProxy { public: explicit TrieUnigramProxy(const Weights &to) : GenericTrieUnigramProxy(to) {} TrieUnigramProxy() {} float Rest() const { return Prob(); } }; struct ProbingEntry { typedef uint64_t Key; typedef Weights Value; uint64_t key; ProbBackoff value; uint64_t GetKey() const { return key; } }; struct TrieUnigramValue { Weights weights; uint64_t next; uint64_t Next() const { return next; } }; const static bool kDifferentRest = false; template void Callback(const Config &, unsigned int, typename Model::Vocabulary &, C &callback) { NoRestBuild build; callback(build); } }; struct RestValue { typedef RestWeights Weights; static const ModelType kProbingModelType = REST_PROBING; class ProbingProxy : public GenericProbingProxy { public: explicit ProbingProxy(const Weights &to) : GenericProbingProxy(to) {} ProbingProxy() {} float Rest() const { return to_->rest; } }; class TrieUnigramProxy : public GenericTrieUnigramProxy { public: explicit TrieUnigramProxy(const Weights &to) : GenericTrieUnigramProxy(to) {} TrieUnigramProxy() {} float Rest() const { return to_->rest; } }; // gcc 4.1 doesn't properly back dependent types :-(. 
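// (Illustrative note, not part of the original source; exact sizes are platform
// dependent.) Without packing, the 8-byte key plus the 12-byte RestWeights value would
// typically be padded to 24 bytes per probing-table entry; #pragma pack(4) below keeps
// the entry at 20 bytes.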
#pragma pack(push) #pragma pack(4) struct ProbingEntry { typedef uint64_t Key; typedef Weights Value; Key key; Value value; Key GetKey() const { return key; } }; struct TrieUnigramValue { Weights weights; uint64_t next; uint64_t Next() const { return next; } }; #pragma pack(pop) const static bool kDifferentRest = true; template void Callback(const Config &config, unsigned int order, typename Model::Vocabulary &vocab, C &callback) { switch (config.rest_function) { case Config::REST_MAX: { MaxRestBuild build; callback(build); } break; case Config::REST_LOWER: { LowerRestBuild build(config, order, vocab); callback(build); } break; } } }; } // namespace ngram } // namespace lm #endif // LM_VALUE__ ================================================ FILE: src/kenlm/lm/value_build.cc ================================================ #include "lm/value_build.hh" #include "lm/model.hh" #include "lm/read_arpa.hh" namespace lm { namespace ngram { template LowerRestBuild::LowerRestBuild(const Config &config, unsigned int order, const typename Model::Vocabulary &vocab) { UTIL_THROW_IF(config.rest_lower_files.size() != order - 1, ConfigException, "This model has order " << order << " so there should be " << (order - 1) << " lower-order models for rest cost purposes."); Config for_lower = config; for_lower.rest_lower_files.clear(); // Unigram models aren't supported, so this is a custom loader. // TODO: optimize the unigram loading? { util::FilePiece uni(config.rest_lower_files[0].c_str()); std::vector number; ReadARPACounts(uni, number); UTIL_THROW_IF(number.size() != 1, FormatLoadException, "Expected the unigram model to have order 1, not " << number.size()); ReadNGramHeader(uni, 1); unigrams_.resize(number[0]); unigrams_[0] = config.unknown_missing_logprob; PositiveProbWarn warn; for (uint64_t i = 0; i < number[0]; ++i) { WordIndex w; Prob entry; ReadNGram(uni, 1, vocab, &w, entry, warn); unigrams_[w] = entry.prob; } } try { for (unsigned int i = 2; i < order; ++i) { models_.push_back(new Model(config.rest_lower_files[i - 1].c_str(), for_lower)); UTIL_THROW_IF(models_.back()->Order() != i, FormatLoadException, "Lower order file " << config.rest_lower_files[i-1] << " should have order " << i); } } catch (...) { for (typename std::vector::const_iterator i = models_.begin(); i != models_.end(); ++i) { delete *i; } models_.clear(); throw; } // TODO: force/check same vocab. } template LowerRestBuild::~LowerRestBuild() { for (typename std::vector::const_iterator i = models_.begin(); i != models_.end(); ++i) { delete *i; } } template class LowerRestBuild; } // namespace ngram } // namespace lm ================================================ FILE: src/kenlm/lm/value_build.hh ================================================ #ifndef LM_VALUE_BUILD__ #define LM_VALUE_BUILD__ #include "lm/weights.hh" #include "lm/word_index.hh" #include "util/bit_packing.hh" #include namespace lm { namespace ngram { struct Config; struct BackoffValue; struct RestValue; class NoRestBuild { public: typedef BackoffValue Value; NoRestBuild() {} void SetRest(const WordIndex *, unsigned int, const Prob &/*prob*/) const {} void SetRest(const WordIndex *, unsigned int, const ProbBackoff &) const {} template bool MarkExtends(ProbBackoff &weights, const Second &) const { util::UnsetSign(weights.prob); return false; } // Probing doesn't need to go back to unigram. 
const static bool kMarkEvenLower = false; }; class MaxRestBuild { public: typedef RestValue Value; MaxRestBuild() {} void SetRest(const WordIndex *, unsigned int, const Prob &/*prob*/) const {} void SetRest(const WordIndex *, unsigned int, RestWeights &weights) const { weights.rest = weights.prob; util::SetSign(weights.rest); } bool MarkExtends(RestWeights &weights, const RestWeights &to) const { util::UnsetSign(weights.prob); if (weights.rest >= to.rest) return false; weights.rest = to.rest; return true; } bool MarkExtends(RestWeights &weights, const Prob &to) const { util::UnsetSign(weights.prob); if (weights.rest >= to.prob) return false; weights.rest = to.prob; return true; } // Probing does need to go back to unigram. const static bool kMarkEvenLower = true; }; template <class Model> class LowerRestBuild { public: typedef RestValue Value; LowerRestBuild(const Config &config, unsigned int order, const typename Model::Vocabulary &vocab); ~LowerRestBuild(); void SetRest(const WordIndex *, unsigned int, const Prob &/*prob*/) const {} void SetRest(const WordIndex *vocab_ids, unsigned int n, RestWeights &weights) const { typename Model::State ignored; if (n == 1) { weights.rest = unigrams_[*vocab_ids]; } else { weights.rest = models_[n-2]->FullScoreForgotState(vocab_ids + 1, vocab_ids + n, *vocab_ids, ignored).prob; } } template <class Second> bool MarkExtends(RestWeights &weights, const Second &) const { util::UnsetSign(weights.prob); return false; } const static bool kMarkEvenLower = false; std::vector<float> unigrams_; std::vector<const Model *> models_; }; } // namespace ngram } // namespace lm #endif // LM_VALUE_BUILD__ ================================================ FILE: src/kenlm/lm/virtual_interface.cc ================================================ #include "lm/virtual_interface.hh" #include "lm/lm_exception.hh" namespace lm { namespace base { Vocabulary::~Vocabulary() {} void Vocabulary::SetSpecial(WordIndex begin_sentence, WordIndex end_sentence, WordIndex not_found) { begin_sentence_ = begin_sentence; end_sentence_ = end_sentence; not_found_ = not_found; } Model::~Model() {} } // namespace base } // namespace lm ================================================ FILE: src/kenlm/lm/virtual_interface.hh ================================================ #ifndef LM_VIRTUAL_INTERFACE__ #define LM_VIRTUAL_INTERFACE__ #include "lm/return.hh" #include "lm/word_index.hh" #include "util/string_piece.hh" #include <string> namespace lm { namespace base { template class ModelFacade; /* Vocabulary interface. Call Index(string) and get a word index for use in * calling Model. It provides faster convenience functions for <s>, </s>, and <unk> * although you can also find these using Index. * * Some models do not load the mapping from index to string. If you need this, * check if the model Vocabulary class implements such a function and access it * directly. * * The Vocabulary object is always owned by the Model and can be retrieved from * the Model using BaseVocabulary() for this abstract interface or * GetVocabulary() for the actual implementation (in which case you'll need the * actual implementation of the Model too). */ class Vocabulary { public: virtual ~Vocabulary(); WordIndex BeginSentence() const { return begin_sentence_; } WordIndex EndSentence() const { return end_sentence_; } WordIndex NotFound() const { return not_found_; } /* Most implementations allow StringPiece lookups and need only override * Index(StringPiece). SRI requires null termination and overrides all * three methods. 
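 *
 * Typical lookups through this interface (illustrative, not part of the original
 * source; "model" stands for any loaded lm::base::Model):
 *   const lm::base::Vocabulary &vocab = model.BaseVocabulary();
 *   lm::WordIndex w = vocab.Index("example");   // typically NotFound() for out-of-vocabulary words
 *   lm::WordIndex bos = vocab.BeginSentence();  // <s>
 *   lm::WordIndex eos = vocab.EndSentence();    // </s>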
*/ virtual WordIndex Index(const StringPiece &str) const = 0; virtual WordIndex Index(const std::string &str) const { return Index(StringPiece(str)); } virtual WordIndex Index(const char *str) const { return Index(StringPiece(str)); } protected: // Call SetSpecial afterward. Vocabulary() {} Vocabulary(WordIndex begin_sentence, WordIndex end_sentence, WordIndex not_found) { SetSpecial(begin_sentence, end_sentence, not_found); } void SetSpecial(WordIndex begin_sentence, WordIndex end_sentence, WordIndex not_found); WordIndex begin_sentence_, end_sentence_, not_found_; private: // Disable copy constructors. They're private and undefined. // Ersatz boost::noncopyable. Vocabulary(const Vocabulary &); Vocabulary &operator=(const Vocabulary &); }; /* There are two ways to access a Model. * * * OPTION 1: Access the Model directly (e.g. lm::ngram::Model in model.hh). * * Every Model implements the scoring function: * float Score( * const Model::State &in_state, * const WordIndex new_word, * Model::State &out_state) const; * * It can also return the length of n-gram matched by the model: * FullScoreReturn FullScore( * const Model::State &in_state, * const WordIndex new_word, * Model::State &out_state) const; * * * There are also accessor functions: * const State &BeginSentenceState() const; * const State &NullContextState() const; * const Vocabulary &GetVocabulary() const; * unsigned int Order() const; * * NB: In case you're wondering why the model implementation looks like it's * missing these methods, see facade.hh. * * This is the fastest way to use a model and presents a normal State class to * be included in a hypothesis state structure. * * * OPTION 2: Use the virtual interface below. * * The virtual interface allow you to decide which Model to use at runtime * without templatizing everything on the Model type. However, each Model has * its own State class, so a single State cannot be efficiently provided (it * would require using the maximum memory of any Model's State or memory * allocation with each lookup). This means you become responsible for * allocating memory with size StateSize() and passing it to the Score or * FullScore functions provided here. * * For example, cdec has a std::string containing the entire state of a * hypothesis. It can reserve StateSize bytes in this string for the model * state. * * All the State objects are POD, so it's ok to use raw memory for storing * State. * in_state and out_state must not have the same address. */ class Model { public: virtual ~Model(); size_t StateSize() const { return state_size_; } const void *BeginSentenceMemory() const { return begin_sentence_memory_; } const void *NullContextMemory() const { return null_context_memory_; } // Requires in_state != out_state virtual float Score(const void *in_state, const WordIndex new_word, void *out_state) const = 0; // Requires in_state != out_state virtual FullScoreReturn FullScore(const void *in_state, const WordIndex new_word, void *out_state) const = 0; unsigned char Order() const { return order_; } const Vocabulary &BaseVocabulary() const { return *base_vocab_; } private: template friend class ModelFacade; explicit Model(size_t state_size) : state_size_(state_size) {} const size_t state_size_; const void *begin_sentence_memory_, *null_context_memory_; const Vocabulary *base_vocab_; unsigned char order_; // Disable copy constructors. They're private and undefined. // Ersatz boost::noncopyable. 
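  // (Illustrative usage of the virtual interface above, not part of the original source;
  // "model" stands for any loaded lm::base::Model.) Because each concrete Model has its
  // own State type, callers own StateSize() bytes of opaque state per hypothesis:
  //
  //   std::vector<char> in(model.StateSize()), out(model.StateSize());
  //   memcpy(&in[0], model.BeginSentenceMemory(), model.StateSize());
  //   lm::WordIndex w = model.BaseVocabulary().Index("example");
  //   float score = model.Score(&in[0], w, &out[0]);   // in_state and out_state must differ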
Model(const Model &); Model &operator=(const Model &); }; } // mamespace base } // namespace lm #endif // LM_VIRTUAL_INTERFACE__ ================================================ FILE: src/kenlm/lm/weights.hh ================================================ #ifndef LM_WEIGHTS__ #define LM_WEIGHTS__ // Weights for n-grams. Probability and possibly a backoff. namespace lm { struct Prob { float prob; }; // No inheritance so this will be a POD. struct ProbBackoff { float prob; float backoff; }; struct RestWeights { float prob; float backoff; float rest; }; } // namespace lm #endif // LM_WEIGHTS__ ================================================ FILE: src/kenlm/lm/word_index.hh ================================================ // Separate header because this is used often. #ifndef LM_WORD_INDEX__ #define LM_WORD_INDEX__ #include namespace lm { typedef unsigned int WordIndex; const WordIndex kMaxWordIndex = UINT_MAX; } // namespace lm typedef lm::WordIndex LMWordIndex; #endif ================================================ FILE: src/kenlm/util/Jamfile ================================================ local compressed_flags = .. HAVE_ZLIB ; local compressed_deps = /top//z ; if [ test_library "bz2" ] && [ test_header "bzlib.h" ] { external-lib bz2 ; compressed_flags += HAVE_BZLIB ; compressed_deps += bz2 ; } if [ test_library "lzma" ] && [ test_header "lzma.h" ] { external-lib lzma ; compressed_flags += HAVE_XZLIB ; compressed_deps += lzma ; } obj read_compressed.o : read_compressed.cc : $(compressed_flags) ; alias read_compressed : read_compressed.o $(compressed_deps) ; obj read_compressed_test.o : read_compressed_test.cc /top//boost_unit_test_framework : $(compressed_flags) ; obj file_piece_test.o : file_piece_test.cc /top//boost_unit_test_framework : $(compressed_flags) ; fakelib kenutil : bit_packing.cc ersatz_progress.cc exception.cc file.cc file_piece.cc mmap.cc murmur_hash.cc pool.cc read_compressed scoped.cc string_piece.cc usage.cc double-conversion//double-conversion : .. : : .. ; import testing ; unit-test bit_packing_test : bit_packing_test.cc kenutil /top//boost_unit_test_framework ; run file_piece_test.o kenutil /top//boost_unit_test_framework : : file_piece.cc ; unit-test read_compressed_test : read_compressed_test.o kenutil /top//boost_unit_test_framework ; unit-test joint_sort_test : joint_sort_test.cc kenutil /top//boost_unit_test_framework ; unit-test probing_hash_table_test : probing_hash_table_test.cc kenutil /top//boost_unit_test_framework ; unit-test sorted_uniform_test : sorted_uniform_test.cc kenutil /top//boost_unit_test_framework ; unit-test tokenize_piece_test : tokenize_piece_test.cc kenutil /top//boost_unit_test_framework ; unit-test multi_intersection_test : multi_intersection_test.cc kenutil /top//boost_unit_test_framework ; ================================================ FILE: src/kenlm/util/bit_packing.cc ================================================ #include "util/bit_packing.hh" #include "util/exception.hh" #include namespace util { namespace { template struct StaticCheck {}; template <> struct StaticCheck { typedef bool StaticAssertionPassed; }; // If your float isn't 4 bytes, we're hosed. 
typedef StaticCheck<sizeof(float) == 4>::StaticAssertionPassed FloatSize; } // namespace uint8_t RequiredBits(uint64_t max_value) { if (!max_value) return 0; uint8_t ret = 1; while (max_value >>= 1) ++ret; return ret; } void BitPackingSanity() { const FloatEnc neg1 = { -1.0 }, pos1 = { 1.0 }; if ((neg1.i ^ pos1.i) != 0x80000000) UTIL_THROW(Exception, "Sign bit is not 0x80000000"); char mem[57+8]; memset(mem, 0, sizeof(mem)); const uint64_t test57 = 0x123456789abcdefULL; for (uint64_t b = 0; b < 57 * 8; b += 57) { WriteInt57(mem, b, 57, test57); } for (uint64_t b = 0; b < 57 * 8; b += 57) { if (test57 != ReadInt57(mem, b, 57, (1ULL << 57) - 1)) UTIL_THROW(Exception, "The bit packing routines are failing for your architecture. Please send a bug report with your architecture, operating system, and compiler."); } // TODO: more checks. } } // namespace util ================================================ FILE: src/kenlm/util/bit_packing.hh ================================================ #ifndef UTIL_BIT_PACKING__ #define UTIL_BIT_PACKING__ /* Bit-level packing routines * * WARNING WARNING WARNING: * The write functions assume that memory is zero initially. This makes them * faster and is the appropriate case for mmapped language model construction. * These routines assume that unaligned access to uint64_t is fast. This is * the case on x86_64. I'm not sure how fast unaligned 64-bit access is on * x86 but my target audience is large language models for which 64-bit is * necessary. * * Call the BitPackingSanity function to sanity check. Calling once suffices, * but it may be called multiple times when that's inconvenient. * * ARM and MinGW ports contributed by Hideo Okuma and Tomoyuki Yoshimura at * NICT. */ #include <assert.h> #ifdef __APPLE__ #include <architecture/byte_order.h> #elif __linux__ #include <endian.h> #elif !defined(_WIN32) && !defined(_WIN64) #include <arpa/nameser_compat.h> #endif #include <inttypes.h> #include <string.h> namespace util { // Fun fact: __BYTE_ORDER is wrong on Solaris Sparc, but the version without __ is correct. #if BYTE_ORDER == LITTLE_ENDIAN inline uint8_t BitPackShift(uint8_t bit, uint8_t /*length*/) { return bit; } #elif BYTE_ORDER == BIG_ENDIAN inline uint8_t BitPackShift(uint8_t bit, uint8_t length) { return 64 - length - bit; } #else #error "Bit packing code isn't written for your byte order." #endif inline uint64_t ReadOff(const void *base, uint64_t bit_off) { #if defined(__arm) || defined(__arm__) const uint8_t *base_off = reinterpret_cast<const uint8_t*>(base) + (bit_off >> 3); uint64_t value64; memcpy(&value64, base_off, sizeof(value64)); return value64; #else return *reinterpret_cast<const uint64_t*>(reinterpret_cast<const uint8_t*>(base) + (bit_off >> 3)); #endif } /* Pack integers up to 57 bits using their least significant digits. * The length is specified using mask: * Assumes mask == (1 << length) - 1 where length <= 57. */ inline uint64_t ReadInt57(const void *base, uint64_t bit_off, uint8_t length, uint64_t mask) { return (ReadOff(base, bit_off) >> BitPackShift(bit_off & 7, length)) & mask; } /* Assumes value < (1 << length) and length <= 57. * Assumes the memory is zero initially. */ inline void WriteInt57(void *base, uint64_t bit_off, uint8_t length, uint64_t value) { #if defined(__arm) || defined(__arm__) uint8_t *base_off = reinterpret_cast<uint8_t*>(base) + (bit_off >> 3); uint64_t value64; memcpy(&value64, base_off, sizeof(value64)); value64 |= (value << BitPackShift(bit_off & 7, length)); memcpy(base_off, &value64, sizeof(value64)); #else *reinterpret_cast<uint64_t*>(reinterpret_cast<uint8_t*>(base) + (bit_off >> 3)) |= (value << BitPackShift(bit_off & 7, length)); #endif } /* Same caveats as above, but for a 25 bit limit.
*/ inline uint32_t ReadInt25(const void *base, uint64_t bit_off, uint8_t length, uint32_t mask) { #if defined(__arm) || defined(__arm__) const uint8_t *base_off = reinterpret_cast(base) + (bit_off >> 3); uint32_t value32; memcpy(&value32, base_off, sizeof(value32)); return (value32 >> BitPackShift(bit_off & 7, length)) & mask; #else return (*reinterpret_cast(reinterpret_cast(base) + (bit_off >> 3)) >> BitPackShift(bit_off & 7, length)) & mask; #endif } inline void WriteInt25(void *base, uint64_t bit_off, uint8_t length, uint32_t value) { #if defined(__arm) || defined(__arm__) uint8_t *base_off = reinterpret_cast(base) + (bit_off >> 3); uint32_t value32; memcpy(&value32, base_off, sizeof(value32)); value32 |= (value << BitPackShift(bit_off & 7, length)); memcpy(base_off, &value32, sizeof(value32)); #else *reinterpret_cast(reinterpret_cast(base) + (bit_off >> 3)) |= (value << BitPackShift(bit_off & 7, length)); #endif } typedef union { float f; uint32_t i; } FloatEnc; inline float ReadFloat32(const void *base, uint64_t bit_off) { FloatEnc encoded; encoded.i = ReadOff(base, bit_off) >> BitPackShift(bit_off & 7, 32); return encoded.f; } inline void WriteFloat32(void *base, uint64_t bit_off, float value) { FloatEnc encoded; encoded.f = value; WriteInt57(base, bit_off, 32, encoded.i); } const uint32_t kSignBit = 0x80000000; inline void SetSign(float &to) { FloatEnc enc; enc.f = to; enc.i |= kSignBit; to = enc.f; } inline void UnsetSign(float &to) { FloatEnc enc; enc.f = to; enc.i &= ~kSignBit; to = enc.f; } inline float ReadNonPositiveFloat31(const void *base, uint64_t bit_off) { FloatEnc encoded; encoded.i = ReadOff(base, bit_off) >> BitPackShift(bit_off & 7, 31); // Sign bit set means negative. encoded.i |= kSignBit; return encoded.f; } inline void WriteNonPositiveFloat31(void *base, uint64_t bit_off, float value) { FloatEnc encoded; encoded.f = value; encoded.i &= ~kSignBit; WriteInt57(base, bit_off, 31, encoded.i); } void BitPackingSanity(); // Return bits required to store integers upto max_value. Not the most // efficient implementation, but this is only called a few times to size tries. 
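As a usage sketch of these routines (not from the repository): pack a few 20-bit integers back to back into a zero-initialized buffer with WriteInt57 and read them back with ReadInt57, passing the (1 << length) - 1 mask the header requires. The buffer must start zeroed because the write functions only OR bits in.

#include <cassert>
#include <cstring>
#include "util/bit_packing.hh"

void PackingDemo() {
  const uint8_t width = 20;                        // bits per value, <= 57
  const uint64_t mask = (1ULL << width) - 1;       // mask == (1 << length) - 1
  char buf[16];
  std::memset(buf, 0, sizeof(buf));                // required: memory starts zeroed
  const uint64_t values[3] = {0x12345, 0xABCDE, 0x7FFFF};
  for (uint64_t i = 0; i < 3; ++i)
    util::WriteInt57(buf, i * width, width, values[i]);
  for (uint64_t i = 0; i < 3; ++i)
    assert(util::ReadInt57(buf, i * width, width, mask) == values[i]);
}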
uint8_t RequiredBits(uint64_t max_value); struct BitsMask { static BitsMask ByMax(uint64_t max_value) { BitsMask ret; ret.FromMax(max_value); return ret; } static BitsMask ByBits(uint8_t bits) { BitsMask ret; ret.bits = bits; ret.mask = (1ULL << bits) - 1; return ret; } void FromMax(uint64_t max_value) { bits = RequiredBits(max_value); mask = (1ULL << bits) - 1; } uint8_t bits; uint64_t mask; }; struct BitAddress { BitAddress(void *in_base, uint64_t in_offset) : base(in_base), offset(in_offset) {} void *base; uint64_t offset; }; } // namespace util #endif // UTIL_BIT_PACKING__ ================================================ FILE: src/kenlm/util/bit_packing_test.cc ================================================ #include "util/bit_packing.hh" #define BOOST_TEST_MODULE BitPackingTest #include #include namespace util { namespace { const uint64_t test57 = 0x123456789abcdefULL; const uint32_t test25 = 0x1234567; BOOST_AUTO_TEST_CASE(ZeroBit57) { char mem[16]; memset(mem, 0, sizeof(mem)); WriteInt57(mem, 0, 57, test57); BOOST_CHECK_EQUAL(test57, ReadInt57(mem, 0, 57, (1ULL << 57) - 1)); } BOOST_AUTO_TEST_CASE(EachBit57) { char mem[16]; for (uint8_t b = 0; b < 8; ++b) { memset(mem, 0, sizeof(mem)); WriteInt57(mem, b, 57, test57); BOOST_CHECK_EQUAL(test57, ReadInt57(mem, b, 57, (1ULL << 57) - 1)); } } BOOST_AUTO_TEST_CASE(Consecutive57) { char mem[57+8]; memset(mem, 0, sizeof(mem)); for (uint64_t b = 0; b < 57 * 8; b += 57) { WriteInt57(mem, b, 57, test57); BOOST_CHECK_EQUAL(test57, ReadInt57(mem, b, 57, (1ULL << 57) - 1)); } for (uint64_t b = 0; b < 57 * 8; b += 57) { BOOST_CHECK_EQUAL(test57, ReadInt57(mem, b, 57, (1ULL << 57) - 1)); } } BOOST_AUTO_TEST_CASE(Consecutive25) { char mem[25+8]; memset(mem, 0, sizeof(mem)); for (uint64_t b = 0; b < 25 * 8; b += 25) { WriteInt25(mem, b, 25, test25); BOOST_CHECK_EQUAL(test25, ReadInt25(mem, b, 25, (1ULL << 25) - 1)); } for (uint64_t b = 0; b < 25 * 8; b += 25) { BOOST_CHECK_EQUAL(test25, ReadInt25(mem, b, 25, (1ULL << 25) - 1)); } } BOOST_AUTO_TEST_CASE(Sanity) { BitPackingSanity(); } } // namespace } // namespace util ================================================ FILE: src/kenlm/util/double-conversion/Jamfile ================================================ fakelib double-conversion : [ glob *.cc ] : : : . ; ================================================ FILE: src/kenlm/util/double-conversion/LICENSE ================================================ Copyright 2006-2011, the V8 project authors. All rights reserved. Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: * Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer. * Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution. * Neither the name of Google Inc. nor the names of its contributors may be used to endorse or promote products derived from this software without specific prior written permission. THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 
IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. ================================================ FILE: src/kenlm/util/double-conversion/bignum-dtoa.cc ================================================ // Copyright 2010 the V8 project authors. All rights reserved. // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following // disclaimer in the documentation and/or other materials provided // with the distribution. // * Neither the name of Google Inc. nor the names of its // contributors may be used to endorse or promote products derived // from this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #include #include "bignum-dtoa.h" #include "bignum.h" #include "ieee.h" namespace double_conversion { static int NormalizedExponent(uint64_t significand, int exponent) { ASSERT(significand != 0); while ((significand & Double::kHiddenBit) == 0) { significand = significand << 1; exponent = exponent - 1; } return exponent; } // Forward declarations: // Returns an estimation of k such that 10^(k-1) <= v < 10^k. static int EstimatePower(int exponent); // Computes v / 10^estimated_power exactly, as a ratio of two bignums, numerator // and denominator. static void InitialScaledStartValues(uint64_t significand, int exponent, bool lower_boundary_is_closer, int estimated_power, bool need_boundary_deltas, Bignum* numerator, Bignum* denominator, Bignum* delta_minus, Bignum* delta_plus); // Multiplies numerator/denominator so that its values lies in the range 1-10. // Returns decimal_point s.t. // v = numerator'/denominator' * 10^(decimal_point-1) // where numerator' and denominator' are the values of numerator and // denominator after the call to this function. 
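To make the quantities in these declarations concrete, a small worked example (not from the source): for v = 3.0 the double decomposes as significand f = 1.5 * 2^52 and exponent e = -51, and the hidden bit is already set, so the normalized exponent stays -51. EstimatePower then returns ceil((e + 53 - 1) * log10(2) - 1e-10) = ceil(0.30103) = 1, and indeed 10^0 <= 3.0 < 10^1. InitialScaledStartValues produces numerator/denominator = v / 10^1 = 0.3; since that ratio is below 1, FixupMultiply10 multiplies the numerator (and the boundary deltas) by 10 and sets decimal_point = 1, after which GenerateShortestDigits emits the single digit '3' and the caller reconstructs 3 * 10^(decimal_point - length) = 3.0.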
static void FixupMultiply10(int estimated_power, bool is_even, int* decimal_point, Bignum* numerator, Bignum* denominator, Bignum* delta_minus, Bignum* delta_plus); // Generates digits from the left to the right and stops when the generated // digits yield the shortest decimal representation of v. static void GenerateShortestDigits(Bignum* numerator, Bignum* denominator, Bignum* delta_minus, Bignum* delta_plus, bool is_even, Vector buffer, int* length); // Generates 'requested_digits' after the decimal point. static void BignumToFixed(int requested_digits, int* decimal_point, Bignum* numerator, Bignum* denominator, Vector(buffer), int* length); // Generates 'count' digits of numerator/denominator. // Once 'count' digits have been produced rounds the result depending on the // remainder (remainders of exactly .5 round upwards). Might update the // decimal_point when rounding up (for example for 0.9999). static void GenerateCountedDigits(int count, int* decimal_point, Bignum* numerator, Bignum* denominator, Vector(buffer), int* length); void BignumDtoa(double v, BignumDtoaMode mode, int requested_digits, Vector buffer, int* length, int* decimal_point) { ASSERT(v > 0); ASSERT(!Double(v).IsSpecial()); uint64_t significand; int exponent; bool lower_boundary_is_closer; if (mode == BIGNUM_DTOA_SHORTEST_SINGLE) { float f = static_cast(v); ASSERT(f == v); significand = Single(f).Significand(); exponent = Single(f).Exponent(); lower_boundary_is_closer = Single(f).LowerBoundaryIsCloser(); } else { significand = Double(v).Significand(); exponent = Double(v).Exponent(); lower_boundary_is_closer = Double(v).LowerBoundaryIsCloser(); } bool need_boundary_deltas = (mode == BIGNUM_DTOA_SHORTEST || mode == BIGNUM_DTOA_SHORTEST_SINGLE); bool is_even = (significand & 1) == 0; int normalized_exponent = NormalizedExponent(significand, exponent); // estimated_power might be too low by 1. int estimated_power = EstimatePower(normalized_exponent); // Shortcut for Fixed. // The requested digits correspond to the digits after the point. If the // number is much too small, then there is no need in trying to get any // digits. if (mode == BIGNUM_DTOA_FIXED && -estimated_power - 1 > requested_digits) { buffer[0] = '\0'; *length = 0; // Set decimal-point to -requested_digits. This is what Gay does. // Note that it should not have any effect anyways since the string is // empty. *decimal_point = -requested_digits; return; } Bignum numerator; Bignum denominator; Bignum delta_minus; Bignum delta_plus; // Make sure the bignum can grow large enough. The smallest double equals // 4e-324. In this case the denominator needs fewer than 324*4 binary digits. // The maximum double is 1.7976931348623157e308 which needs fewer than // 308*4 binary digits. ASSERT(Bignum::kMaxSignificantBits >= 324*4); InitialScaledStartValues(significand, exponent, lower_boundary_is_closer, estimated_power, need_boundary_deltas, &numerator, &denominator, &delta_minus, &delta_plus); // We now have v = (numerator / denominator) * 10^estimated_power. 
FixupMultiply10(estimated_power, is_even, decimal_point, &numerator, &denominator, &delta_minus, &delta_plus); // We now have v = (numerator / denominator) * 10^(decimal_point-1), and // 1 <= (numerator + delta_plus) / denominator < 10 switch (mode) { case BIGNUM_DTOA_SHORTEST: case BIGNUM_DTOA_SHORTEST_SINGLE: GenerateShortestDigits(&numerator, &denominator, &delta_minus, &delta_plus, is_even, buffer, length); break; case BIGNUM_DTOA_FIXED: BignumToFixed(requested_digits, decimal_point, &numerator, &denominator, buffer, length); break; case BIGNUM_DTOA_PRECISION: GenerateCountedDigits(requested_digits, decimal_point, &numerator, &denominator, buffer, length); break; default: UNREACHABLE(); } buffer[*length] = '\0'; } // The procedure starts generating digits from the left to the right and stops // when the generated digits yield the shortest decimal representation of v. A // decimal representation of v is a number lying closer to v than to any other // double, so it converts to v when read. // // This is true if d, the decimal representation, is between m- and m+, the // upper and lower boundaries. d must be strictly between them if !is_even. // m- := (numerator - delta_minus) / denominator // m+ := (numerator + delta_plus) / denominator // // Precondition: 0 <= (numerator+delta_plus) / denominator < 10. // If 1 <= (numerator+delta_plus) / denominator < 10 then no leading 0 digit // will be produced. This should be the standard precondition. static void GenerateShortestDigits(Bignum* numerator, Bignum* denominator, Bignum* delta_minus, Bignum* delta_plus, bool is_even, Vector buffer, int* length) { // Small optimization: if delta_minus and delta_plus are the same just reuse // one of the two bignums. if (Bignum::Equal(*delta_minus, *delta_plus)) { delta_plus = delta_minus; } *length = 0; while (true) { uint16_t digit; digit = numerator->DivideModuloIntBignum(*denominator); ASSERT(digit <= 9); // digit is a uint16_t and therefore always positive. // digit = numerator / denominator (integer division). // numerator = numerator % denominator. buffer[(*length)++] = digit + '0'; // Can we stop already? // If the remainder of the division is less than the distance to the lower // boundary we can stop. In this case we simply round down (discarding the // remainder). // Similarly we test if we can round up (using the upper boundary). bool in_delta_room_minus; bool in_delta_room_plus; if (is_even) { in_delta_room_minus = Bignum::LessEqual(*numerator, *delta_minus); } else { in_delta_room_minus = Bignum::Less(*numerator, *delta_minus); } if (is_even) { in_delta_room_plus = Bignum::PlusCompare(*numerator, *delta_plus, *denominator) >= 0; } else { in_delta_room_plus = Bignum::PlusCompare(*numerator, *delta_plus, *denominator) > 0; } if (!in_delta_room_minus && !in_delta_room_plus) { // Prepare for next iteration. numerator->Times10(); delta_minus->Times10(); // We optimized delta_plus to be equal to delta_minus (if they share the // same value). So don't multiply delta_plus if they point to the same // object. if (delta_minus != delta_plus) { delta_plus->Times10(); } } else if (in_delta_room_minus && in_delta_room_plus) { // Let's see if 2*numerator < denominator. // If yes, then the next digit would be < 5 and we can round down. int compare = Bignum::PlusCompare(*numerator, *numerator, *denominator); if (compare < 0) { // Remaining digits are less than .5. -> Round down (== do nothing). } else if (compare > 0) { // Remaining digits are more than .5 of denominator. -> Round up. 
// Note that the last digit could not be a '9' as otherwise the whole // loop would have stopped earlier. // We still have an assert here in case the preconditions were not // satisfied. ASSERT(buffer[(*length) - 1] != '9'); buffer[(*length) - 1]++; } else { // Halfway case. // TODO(floitsch): need a way to solve half-way cases. // For now let's round towards even (since this is what Gay seems to // do). if ((buffer[(*length) - 1] - '0') % 2 == 0) { // Round down => Do nothing. } else { ASSERT(buffer[(*length) - 1] != '9'); buffer[(*length) - 1]++; } } return; } else if (in_delta_room_minus) { // Round down (== do nothing). return; } else { // in_delta_room_plus // Round up. // Note again that the last digit could not be '9' since this would have // stopped the loop earlier. // We still have an ASSERT here, in case the preconditions were not // satisfied. ASSERT(buffer[(*length) - 1] != '9'); buffer[(*length) - 1]++; return; } } } // Let v = numerator / denominator < 10. // Then we generate 'count' digits of d = x.xxxxx... (without the decimal point) // from left to right. Once 'count' digits have been produced we decide whether // to round up or down. Remainders of exactly .5 round upwards. Numbers such // as 9.999999 propagate a carry all the way, and change the // exponent (decimal_point), when rounding upwards. static void GenerateCountedDigits(int count, int* decimal_point, Bignum* numerator, Bignum* denominator, Vector<char> buffer, int* length) { ASSERT(count >= 0); for (int i = 0; i < count - 1; ++i) { uint16_t digit; digit = numerator->DivideModuloIntBignum(*denominator); ASSERT(digit <= 9); // digit is a uint16_t and therefore always positive. // digit = numerator / denominator (integer division). // numerator = numerator % denominator. buffer[i] = digit + '0'; // Prepare for next iteration. numerator->Times10(); } // Generate the last digit. uint16_t digit; digit = numerator->DivideModuloIntBignum(*denominator); if (Bignum::PlusCompare(*numerator, *numerator, *denominator) >= 0) { digit++; } buffer[count - 1] = digit + '0'; // Correct bad digits (in case we had a sequence of '9's). Propagate the // carry until we hit a non-'9' or until we reach the first digit. for (int i = count - 1; i > 0; --i) { if (buffer[i] != '0' + 10) break; buffer[i] = '0'; buffer[i - 1]++; } if (buffer[0] == '0' + 10) { // Propagate a carry past the top place. buffer[0] = '1'; (*decimal_point)++; } *length = count; } // Generates 'requested_digits' after the decimal point. It might omit // trailing '0's. If the input number is too small then no digits at all are // generated (ex.: 2 fixed digits for 0.00001). // // Input verifies: 1 <= (numerator + delta) / denominator < 10. static void BignumToFixed(int requested_digits, int* decimal_point, Bignum* numerator, Bignum* denominator, Vector<char> buffer, int* length) { // Note that we have to look at more than just the requested_digits, since // a number could be rounded up. Example: v=0.5 with requested_digits=0. // Even though the power of v equals 0 we can't just stop here. if (-(*decimal_point) > requested_digits) { // The number is definitively too small. // Ex: 0.001 with requested_digits == 1. // Set decimal-point to -requested_digits. This is what Gay does. // Note that it should not have any effect anyways since the string is // empty. *decimal_point = -requested_digits; *length = 0; return; } else if (-(*decimal_point) == requested_digits) { // We only need to verify if the number rounds down or up. // Ex: 0.04 and 0.06 with requested_digits == 1.
ASSERT(*decimal_point == -requested_digits); // Initially the fraction lies in range (1, 10]. Multiply the denominator // by 10 so that we can compare more easily. denominator->Times10(); if (Bignum::PlusCompare(*numerator, *numerator, *denominator) >= 0) { // If the fraction is >= 0.5 then we have to include the rounded // digit. buffer[0] = '1'; *length = 1; (*decimal_point)++; } else { // Note that we caught most of similar cases earlier. *length = 0; } return; } else { // The requested digits correspond to the digits after the point. // The variable 'needed_digits' includes the digits before the point. int needed_digits = (*decimal_point) + requested_digits; GenerateCountedDigits(needed_digits, decimal_point, numerator, denominator, buffer, length); } } // Returns an estimation of k such that 10^(k-1) <= v < 10^k where // v = f * 2^exponent and 2^52 <= f < 2^53. // v is hence a normalized double with the given exponent. The output is an // approximation for the exponent of the decimal approimation .digits * 10^k. // // The result might undershoot by 1 in which case 10^k <= v < 10^k+1. // Note: this property holds for v's upper boundary m+ too. // 10^k <= m+ < 10^k+1. // (see explanation below). // // Examples: // EstimatePower(0) => 16 // EstimatePower(-52) => 0 // // Note: e >= 0 => EstimatedPower(e) > 0. No similar claim can be made for e<0. static int EstimatePower(int exponent) { // This function estimates log10 of v where v = f*2^e (with e == exponent). // Note that 10^floor(log10(v)) <= v, but v <= 10^ceil(log10(v)). // Note that f is bounded by its container size. Let p = 53 (the double's // significand size). Then 2^(p-1) <= f < 2^p. // // Given that log10(v) == log2(v)/log2(10) and e+(len(f)-1) is quite close // to log2(v) the function is simplified to (e+(len(f)-1)/log2(10)). // The computed number undershoots by less than 0.631 (when we compute log3 // and not log10). // // Optimization: since we only need an approximated result this computation // can be performed on 64 bit integers. On x86/x64 architecture the speedup is // not really measurable, though. // // Since we want to avoid overshooting we decrement by 1e10 so that // floating-point imprecisions don't affect us. // // Explanation for v's boundary m+: the computation takes advantage of // the fact that 2^(p-1) <= f < 2^p. Boundaries still satisfy this requirement // (even for denormals where the delta can be much more important). const double k1Log10 = 0.30102999566398114; // 1/lg(10) // For doubles len(f) == 53 (don't forget the hidden bit). const int kSignificandSize = Double::kSignificandSize; double estimate = ceil((exponent + kSignificandSize - 1) * k1Log10 - 1e-10); return static_cast(estimate); } // See comments for InitialScaledStartValues. static void InitialScaledStartValuesPositiveExponent( uint64_t significand, int exponent, int estimated_power, bool need_boundary_deltas, Bignum* numerator, Bignum* denominator, Bignum* delta_minus, Bignum* delta_plus) { // A positive exponent implies a positive power. ASSERT(estimated_power >= 0); // Since the estimated_power is positive we simply multiply the denominator // by 10^estimated_power. // numerator = v. numerator->AssignUInt64(significand); numerator->ShiftLeft(exponent); // denominator = 10^estimated_power. denominator->AssignPowerUInt16(10, estimated_power); if (need_boundary_deltas) { // Introduce a common denominator so that the deltas to the boundaries are // integers. 
denominator->ShiftLeft(1); numerator->ShiftLeft(1); // Let v = f * 2^e, then m+ - v = 1/2 * 2^e; With the common // denominator (of 2) delta_plus equals 2^e. delta_plus->AssignUInt16(1); delta_plus->ShiftLeft(exponent); // Same for delta_minus. The adjustments if f == 2^p-1 are done later. delta_minus->AssignUInt16(1); delta_minus->ShiftLeft(exponent); } } // See comments for InitialScaledStartValues static void InitialScaledStartValuesNegativeExponentPositivePower( uint64_t significand, int exponent, int estimated_power, bool need_boundary_deltas, Bignum* numerator, Bignum* denominator, Bignum* delta_minus, Bignum* delta_plus) { // v = f * 2^e with e < 0, and with estimated_power >= 0. // This means that e is close to 0 (have a look at how estimated_power is // computed). // numerator = significand // since v = significand * 2^exponent this is equivalent to // numerator = v * / 2^-exponent numerator->AssignUInt64(significand); // denominator = 10^estimated_power * 2^-exponent (with exponent < 0) denominator->AssignPowerUInt16(10, estimated_power); denominator->ShiftLeft(-exponent); if (need_boundary_deltas) { // Introduce a common denominator so that the deltas to the boundaries are // integers. denominator->ShiftLeft(1); numerator->ShiftLeft(1); // Let v = f * 2^e, then m+ - v = 1/2 * 2^e; With the common // denominator (of 2) delta_plus equals 2^e. // Given that the denominator already includes v's exponent the distance // to the boundaries is simply 1. delta_plus->AssignUInt16(1); // Same for delta_minus. The adjustments if f == 2^p-1 are done later. delta_minus->AssignUInt16(1); } } // See comments for InitialScaledStartValues static void InitialScaledStartValuesNegativeExponentNegativePower( uint64_t significand, int exponent, int estimated_power, bool need_boundary_deltas, Bignum* numerator, Bignum* denominator, Bignum* delta_minus, Bignum* delta_plus) { // Instead of multiplying the denominator with 10^estimated_power we // multiply all values (numerator and deltas) by 10^-estimated_power. // Use numerator as temporary container for power_ten. Bignum* power_ten = numerator; power_ten->AssignPowerUInt16(10, -estimated_power); if (need_boundary_deltas) { // Since power_ten == numerator we must make a copy of 10^estimated_power // before we complete the computation of the numerator. // delta_plus = delta_minus = 10^estimated_power delta_plus->AssignBignum(*power_ten); delta_minus->AssignBignum(*power_ten); } // numerator = significand * 2 * 10^-estimated_power // since v = significand * 2^exponent this is equivalent to // numerator = v * 10^-estimated_power * 2 * 2^-exponent. // Remember: numerator has been abused as power_ten. So no need to assign it // to itself. ASSERT(numerator == power_ten); numerator->MultiplyByUInt64(significand); // denominator = 2 * 2^-exponent with exponent < 0. denominator->AssignUInt16(1); denominator->ShiftLeft(-exponent); if (need_boundary_deltas) { // Introduce a common denominator so that the deltas to the boundaries are // integers. numerator->ShiftLeft(1); denominator->ShiftLeft(1); // With this shift the boundaries have their correct value, since // delta_plus = 10^-estimated_power, and // delta_minus = 10^-estimated_power. // These assignments have been done earlier. // The adjustments if f == 2^p-1 (lower boundary is closer) are done later. } } // Let v = significand * 2^exponent. // Computes v / 10^estimated_power exactly, as a ratio of two bignums, numerator // and denominator. 
The functions GenerateShortestDigits and // GenerateCountedDigits will then convert this ratio to its decimal // representation d, with the required accuracy. // Then d * 10^estimated_power is the representation of v. // (Note: the fraction and the estimated_power might get adjusted before // generating the decimal representation.) // // The initial start values consist of: // - a scaled numerator: s.t. numerator/denominator == v / 10^estimated_power. // - a scaled (common) denominator. // optionally (used by GenerateShortestDigits to decide if it has the shortest // decimal converting back to v): // - v - m-: the distance to the lower boundary. // - m+ - v: the distance to the upper boundary. // // v, m+, m-, and therefore v - m- and m+ - v all share the same denominator. // // Let ep == estimated_power, then the returned values will satisfy: // v / 10^ep = numerator / denominator. // v's boundarys m- and m+: // m- / 10^ep == v / 10^ep - delta_minus / denominator // m+ / 10^ep == v / 10^ep + delta_plus / denominator // Or in other words: // m- == v - delta_minus * 10^ep / denominator; // m+ == v + delta_plus * 10^ep / denominator; // // Since 10^(k-1) <= v < 10^k (with k == estimated_power) // or 10^k <= v < 10^(k+1) // we then have 0.1 <= numerator/denominator < 1 // or 1 <= numerator/denominator < 10 // // It is then easy to kickstart the digit-generation routine. // // The boundary-deltas are only filled if the mode equals BIGNUM_DTOA_SHORTEST // or BIGNUM_DTOA_SHORTEST_SINGLE. static void InitialScaledStartValues(uint64_t significand, int exponent, bool lower_boundary_is_closer, int estimated_power, bool need_boundary_deltas, Bignum* numerator, Bignum* denominator, Bignum* delta_minus, Bignum* delta_plus) { if (exponent >= 0) { InitialScaledStartValuesPositiveExponent( significand, exponent, estimated_power, need_boundary_deltas, numerator, denominator, delta_minus, delta_plus); } else if (estimated_power >= 0) { InitialScaledStartValuesNegativeExponentPositivePower( significand, exponent, estimated_power, need_boundary_deltas, numerator, denominator, delta_minus, delta_plus); } else { InitialScaledStartValuesNegativeExponentNegativePower( significand, exponent, estimated_power, need_boundary_deltas, numerator, denominator, delta_minus, delta_plus); } if (need_boundary_deltas && lower_boundary_is_closer) { // The lower boundary is closer at half the distance of "normal" numbers. // Increase the common denominator and adapt all but the delta_minus. denominator->ShiftLeft(1); // *2 numerator->ShiftLeft(1); // *2 delta_plus->ShiftLeft(1); // *2 } } // This routine multiplies numerator/denominator so that its values lies in the // range 1-10. That is after a call to this function we have: // 1 <= (numerator + delta_plus) /denominator < 10. // Let numerator the input before modification and numerator' the argument // after modification, then the output-parameter decimal_point is such that // numerator / denominator * 10^estimated_power == // numerator' / denominator' * 10^(decimal_point - 1) // In some cases estimated_power was too low, and this is already the case. We // then simply adjust the power so that 10^(k-1) <= v < 10^k (with k == // estimated_power) but do not touch the numerator or denominator. // Otherwise the routine multiplies the numerator and the deltas by 10. 
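A concrete illustration of the "estimated_power was too low" case this comment describes (not from the source): for v = 10.0 the significand is 1.25 * 2^52 and the binary exponent is -49, so EstimatePower returns ceil((-49 + 52) * 0.30103 - 1e-10) = 1, while the true decimal exponent k with 10^(k-1) <= v < 10^k is 2. The scaled ratio v / 10^1 = 1.0 already lies in [1, 10), so FixupMultiply10 takes its first branch and simply sets decimal_point = estimated_power + 1 = 2 without touching the numerator. For v = 3.0, by contrast, the ratio 0.3 falls below 1, so the second branch multiplies the numerator and both deltas by 10 and sets decimal_point = estimated_power = 1.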
static void FixupMultiply10(int estimated_power, bool is_even, int* decimal_point, Bignum* numerator, Bignum* denominator, Bignum* delta_minus, Bignum* delta_plus) { bool in_range; if (is_even) { // For IEEE doubles half-way cases (in decimal system numbers ending with 5) // are rounded to the closest floating-point number with even significand. in_range = Bignum::PlusCompare(*numerator, *delta_plus, *denominator) >= 0; } else { in_range = Bignum::PlusCompare(*numerator, *delta_plus, *denominator) > 0; } if (in_range) { // Since numerator + delta_plus >= denominator we already have // 1 <= numerator/denominator < 10. Simply update the estimated_power. *decimal_point = estimated_power + 1; } else { *decimal_point = estimated_power; numerator->Times10(); if (Bignum::Equal(*delta_minus, *delta_plus)) { delta_minus->Times10(); delta_plus->AssignBignum(*delta_minus); } else { delta_minus->Times10(); delta_plus->Times10(); } } } } // namespace double_conversion ================================================ FILE: src/kenlm/util/double-conversion/bignum-dtoa.h ================================================ // Copyright 2010 the V8 project authors. All rights reserved. // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following // disclaimer in the documentation and/or other materials provided // with the distribution. // * Neither the name of Google Inc. nor the names of its // contributors may be used to endorse or promote products derived // from this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #ifndef DOUBLE_CONVERSION_BIGNUM_DTOA_H_ #define DOUBLE_CONVERSION_BIGNUM_DTOA_H_ #include "utils.h" namespace double_conversion { enum BignumDtoaMode { // Return the shortest correct representation. // For example the output of 0.299999999999999988897 is (the less accurate but // correct) 0.3. BIGNUM_DTOA_SHORTEST, // Same as BIGNUM_DTOA_SHORTEST but for single-precision floats. BIGNUM_DTOA_SHORTEST_SINGLE, // Return a fixed number of digits after the decimal point. // For instance fixed(0.1, 4) becomes 0.1000 // If the input number is big, the output will be big. BIGNUM_DTOA_FIXED, // Return a fixed number of digits, no matter what the exponent is. BIGNUM_DTOA_PRECISION }; // Converts the given double 'v' to ascii. // The result should be interpreted as buffer * 10^(point-length). // The buffer will be null-terminated. 
// // The input v must be > 0 and different from NaN, and Infinity. // // The output depends on the given mode: // - SHORTEST: produce the least amount of digits for which the internal // identity requirement is still satisfied. If the digits are printed // (together with the correct exponent) then reading this number will give // 'v' again. The buffer will choose the representation that is closest to // 'v'. If there are two at the same distance, than the number is round up. // In this mode the 'requested_digits' parameter is ignored. // - FIXED: produces digits necessary to print a given number with // 'requested_digits' digits after the decimal point. The produced digits // might be too short in which case the caller has to fill the gaps with '0's. // Example: toFixed(0.001, 5) is allowed to return buffer="1", point=-2. // Halfway cases are rounded up. The call toFixed(0.15, 2) thus returns // buffer="2", point=0. // Note: the length of the returned buffer has no meaning wrt the significance // of its digits. That is, just because it contains '0's does not mean that // any other digit would not satisfy the internal identity requirement. // - PRECISION: produces 'requested_digits' where the first digit is not '0'. // Even though the length of produced digits usually equals // 'requested_digits', the function is allowed to return fewer digits, in // which case the caller has to fill the missing digits with '0's. // Halfway cases are again rounded up. // 'BignumDtoa' expects the given buffer to be big enough to hold all digits // and a terminating null-character. void BignumDtoa(double v, BignumDtoaMode mode, int requested_digits, Vector buffer, int* length, int* point); } // namespace double_conversion #endif // DOUBLE_CONVERSION_BIGNUM_DTOA_H_ ================================================ FILE: src/kenlm/util/double-conversion/bignum.cc ================================================ // Copyright 2010 the V8 project authors. All rights reserved. // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following // disclaimer in the documentation and/or other materials provided // with the distribution. // * Neither the name of Google Inc. nor the names of its // contributors may be used to endorse or promote products derived // from this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
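As a usage sketch of the interface declared in bignum-dtoa.h (not from the repository; the Vector<char>(ptr, len) construction and the buffer size are assumptions for illustration), the three modes can be driven like this:

#include <cstdio>
#include "bignum-dtoa.h"

void DtoaDemo() {
  using namespace double_conversion;
  const int kBufferSize = 128;
  char digits[kBufferSize];
  int length, point;
  // SHORTEST: fewest digits that still read back as exactly 0.3.
  BignumDtoa(0.3, BIGNUM_DTOA_SHORTEST, 0, Vector<char>(digits, kBufferSize), &length, &point);
  // digits = "3", length = 1, point = 0  =>  value = 3 * 10^(0 - 1) = 0.3
  // FIXED: four digits after the decimal point of 0.1; the caller pads with '0's as needed.
  BignumDtoa(0.1, BIGNUM_DTOA_FIXED, 4, Vector<char>(digits, kBufferSize), &length, &point);
  // PRECISION: three significant digits of 12345.0.
  BignumDtoa(12345.0, BIGNUM_DTOA_PRECISION, 3, Vector<char>(digits, kBufferSize), &length, &point);
  // digits = "123", length = 3, point = 5  =>  value = 123 * 10^(5 - 3) = 12300
  std::printf("%.*s (point %d)\n", length, digits, point);
}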
#include "bignum.h" #include "utils.h" namespace double_conversion { Bignum::Bignum() : bigits_(bigits_buffer_, kBigitCapacity), used_digits_(0), exponent_(0) { for (int i = 0; i < kBigitCapacity; ++i) { bigits_[i] = 0; } } template static int BitSize(S value) { return 8 * sizeof(value); } // Guaranteed to lie in one Bigit. void Bignum::AssignUInt16(uint16_t value) { ASSERT(kBigitSize >= BitSize(value)); Zero(); if (value == 0) return; EnsureCapacity(1); bigits_[0] = value; used_digits_ = 1; } void Bignum::AssignUInt64(uint64_t value) { const int kUInt64Size = 64; Zero(); if (value == 0) return; int needed_bigits = kUInt64Size / kBigitSize + 1; EnsureCapacity(needed_bigits); for (int i = 0; i < needed_bigits; ++i) { bigits_[i] = value & kBigitMask; value = value >> kBigitSize; } used_digits_ = needed_bigits; Clamp(); } void Bignum::AssignBignum(const Bignum& other) { exponent_ = other.exponent_; for (int i = 0; i < other.used_digits_; ++i) { bigits_[i] = other.bigits_[i]; } // Clear the excess digits (if there were any). for (int i = other.used_digits_; i < used_digits_; ++i) { bigits_[i] = 0; } used_digits_ = other.used_digits_; } static uint64_t ReadUInt64(Vector buffer, int from, int digits_to_read) { uint64_t result = 0; for (int i = from; i < from + digits_to_read; ++i) { int digit = buffer[i] - '0'; ASSERT(0 <= digit && digit <= 9); result = result * 10 + digit; } return result; } void Bignum::AssignDecimalString(Vector value) { // 2^64 = 18446744073709551616 > 10^19 const int kMaxUint64DecimalDigits = 19; Zero(); int length = value.length(); int pos = 0; // Let's just say that each digit needs 4 bits. while (length >= kMaxUint64DecimalDigits) { uint64_t digits = ReadUInt64(value, pos, kMaxUint64DecimalDigits); pos += kMaxUint64DecimalDigits; length -= kMaxUint64DecimalDigits; MultiplyByPowerOfTen(kMaxUint64DecimalDigits); AddUInt64(digits); } uint64_t digits = ReadUInt64(value, pos, length); MultiplyByPowerOfTen(length); AddUInt64(digits); Clamp(); } static int HexCharValue(char c) { if ('0' <= c && c <= '9') return c - '0'; if ('a' <= c && c <= 'f') return 10 + c - 'a'; if ('A' <= c && c <= 'F') return 10 + c - 'A'; UNREACHABLE(); return 0; // To make compiler happy. } void Bignum::AssignHexString(Vector value) { Zero(); int length = value.length(); int needed_bigits = length * 4 / kBigitSize + 1; EnsureCapacity(needed_bigits); int string_index = length - 1; for (int i = 0; i < needed_bigits - 1; ++i) { // These bigits are guaranteed to be "full". Chunk current_bigit = 0; for (int j = 0; j < kBigitSize / 4; j++) { current_bigit += HexCharValue(value[string_index--]) << (j * 4); } bigits_[i] = current_bigit; } used_digits_ = needed_bigits - 1; Chunk most_significant_bigit = 0; // Could be = 0; for (int j = 0; j <= string_index; ++j) { most_significant_bigit <<= 4; most_significant_bigit += HexCharValue(value[j]); } if (most_significant_bigit != 0) { bigits_[used_digits_] = most_significant_bigit; used_digits_++; } Clamp(); } void Bignum::AddUInt64(uint64_t operand) { if (operand == 0) return; Bignum other; other.AssignUInt64(operand); AddBignum(other); } void Bignum::AddBignum(const Bignum& other) { ASSERT(IsClamped()); ASSERT(other.IsClamped()); // If this has a greater exponent than other append zero-bigits to this. // After this call exponent_ <= other.exponent_. 
Align(other); // There are two possibilities: // aaaaaaaaaaa 0000 (where the 0s represent a's exponent) // bbbbb 00000000 // ---------------- // ccccccccccc 0000 // or // aaaaaaaaaa 0000 // bbbbbbbbb 0000000 // ----------------- // cccccccccccc 0000 // In both cases we might need a carry bigit. EnsureCapacity(1 + Max(BigitLength(), other.BigitLength()) - exponent_); Chunk carry = 0; int bigit_pos = other.exponent_ - exponent_; ASSERT(bigit_pos >= 0); for (int i = 0; i < other.used_digits_; ++i) { Chunk sum = bigits_[bigit_pos] + other.bigits_[i] + carry; bigits_[bigit_pos] = sum & kBigitMask; carry = sum >> kBigitSize; bigit_pos++; } while (carry != 0) { Chunk sum = bigits_[bigit_pos] + carry; bigits_[bigit_pos] = sum & kBigitMask; carry = sum >> kBigitSize; bigit_pos++; } used_digits_ = Max(bigit_pos, used_digits_); ASSERT(IsClamped()); } void Bignum::SubtractBignum(const Bignum& other) { ASSERT(IsClamped()); ASSERT(other.IsClamped()); // We require this to be bigger than other. ASSERT(LessEqual(other, *this)); Align(other); int offset = other.exponent_ - exponent_; Chunk borrow = 0; int i; for (i = 0; i < other.used_digits_; ++i) { ASSERT((borrow == 0) || (borrow == 1)); Chunk difference = bigits_[i + offset] - other.bigits_[i] - borrow; bigits_[i + offset] = difference & kBigitMask; borrow = difference >> (kChunkSize - 1); } while (borrow != 0) { Chunk difference = bigits_[i + offset] - borrow; bigits_[i + offset] = difference & kBigitMask; borrow = difference >> (kChunkSize - 1); ++i; } Clamp(); } void Bignum::ShiftLeft(int shift_amount) { if (used_digits_ == 0) return; exponent_ += shift_amount / kBigitSize; int local_shift = shift_amount % kBigitSize; EnsureCapacity(used_digits_ + 1); BigitsShiftLeft(local_shift); } void Bignum::MultiplyByUInt32(uint32_t factor) { if (factor == 1) return; if (factor == 0) { Zero(); return; } if (used_digits_ == 0) return; // The product of a bigit with the factor is of size kBigitSize + 32. // Assert that this number + 1 (for the carry) fits into double chunk. 
ASSERT(kDoubleChunkSize >= kBigitSize + 32 + 1); DoubleChunk carry = 0; for (int i = 0; i < used_digits_; ++i) { DoubleChunk product = static_cast(factor) * bigits_[i] + carry; bigits_[i] = static_cast(product & kBigitMask); carry = (product >> kBigitSize); } while (carry != 0) { EnsureCapacity(used_digits_ + 1); bigits_[used_digits_] = carry & kBigitMask; used_digits_++; carry >>= kBigitSize; } } void Bignum::MultiplyByUInt64(uint64_t factor) { if (factor == 1) return; if (factor == 0) { Zero(); return; } ASSERT(kBigitSize < 32); uint64_t carry = 0; uint64_t low = factor & 0xFFFFFFFF; uint64_t high = factor >> 32; for (int i = 0; i < used_digits_; ++i) { uint64_t product_low = low * bigits_[i]; uint64_t product_high = high * bigits_[i]; uint64_t tmp = (carry & kBigitMask) + product_low; bigits_[i] = tmp & kBigitMask; carry = (carry >> kBigitSize) + (tmp >> kBigitSize) + (product_high << (32 - kBigitSize)); } while (carry != 0) { EnsureCapacity(used_digits_ + 1); bigits_[used_digits_] = carry & kBigitMask; used_digits_++; carry >>= kBigitSize; } } void Bignum::MultiplyByPowerOfTen(int exponent) { const uint64_t kFive27 = UINT64_2PART_C(0x6765c793, fa10079d); const uint16_t kFive1 = 5; const uint16_t kFive2 = kFive1 * 5; const uint16_t kFive3 = kFive2 * 5; const uint16_t kFive4 = kFive3 * 5; const uint16_t kFive5 = kFive4 * 5; const uint16_t kFive6 = kFive5 * 5; const uint32_t kFive7 = kFive6 * 5; const uint32_t kFive8 = kFive7 * 5; const uint32_t kFive9 = kFive8 * 5; const uint32_t kFive10 = kFive9 * 5; const uint32_t kFive11 = kFive10 * 5; const uint32_t kFive12 = kFive11 * 5; const uint32_t kFive13 = kFive12 * 5; const uint32_t kFive1_to_12[] = { kFive1, kFive2, kFive3, kFive4, kFive5, kFive6, kFive7, kFive8, kFive9, kFive10, kFive11, kFive12 }; ASSERT(exponent >= 0); if (exponent == 0) return; if (used_digits_ == 0) return; // We shift by exponent at the end just before returning. int remaining_exponent = exponent; while (remaining_exponent >= 27) { MultiplyByUInt64(kFive27); remaining_exponent -= 27; } while (remaining_exponent >= 13) { MultiplyByUInt32(kFive13); remaining_exponent -= 13; } if (remaining_exponent > 0) { MultiplyByUInt32(kFive1_to_12[remaining_exponent - 1]); } ShiftLeft(exponent); } void Bignum::Square() { ASSERT(IsClamped()); int product_length = 2 * used_digits_; EnsureCapacity(product_length); // Comba multiplication: compute each column separately. // Example: r = a2a1a0 * b2b1b0. // r = 1 * a0b0 + // 10 * (a1b0 + a0b1) + // 100 * (a2b0 + a1b1 + a0b2) + // 1000 * (a2b1 + a1b2) + // 10000 * a2b2 // // In the worst case we have to accumulate nb-digits products of digit*digit. // // Assert that the additional number of bits in a DoubleChunk are enough to // sum up used_digits of Bigit*Bigit. if ((1 << (2 * (kChunkSize - kBigitSize))) <= used_digits_) { UNIMPLEMENTED(); } DoubleChunk accumulator = 0; // First shift the digits so we don't overwrite them. int copy_offset = used_digits_; for (int i = 0; i < used_digits_; ++i) { bigits_[copy_offset + i] = bigits_[i]; } // We have two loops to avoid some 'if's in the loop. for (int i = 0; i < used_digits_; ++i) { // Process temporary digit i with power i. // The sum of the two indices must be equal to i. int bigit_index1 = i; int bigit_index2 = 0; // Sum all of the sub-products. 
while (bigit_index1 >= 0) { Chunk chunk1 = bigits_[copy_offset + bigit_index1]; Chunk chunk2 = bigits_[copy_offset + bigit_index2]; accumulator += static_cast(chunk1) * chunk2; bigit_index1--; bigit_index2++; } bigits_[i] = static_cast(accumulator) & kBigitMask; accumulator >>= kBigitSize; } for (int i = used_digits_; i < product_length; ++i) { int bigit_index1 = used_digits_ - 1; int bigit_index2 = i - bigit_index1; // Invariant: sum of both indices is again equal to i. // Inner loop runs 0 times on last iteration, emptying accumulator. while (bigit_index2 < used_digits_) { Chunk chunk1 = bigits_[copy_offset + bigit_index1]; Chunk chunk2 = bigits_[copy_offset + bigit_index2]; accumulator += static_cast(chunk1) * chunk2; bigit_index1--; bigit_index2++; } // The overwritten bigits_[i] will never be read in further loop iterations, // because bigit_index1 and bigit_index2 are always greater // than i - used_digits_. bigits_[i] = static_cast(accumulator) & kBigitMask; accumulator >>= kBigitSize; } // Since the result was guaranteed to lie inside the number the // accumulator must be 0 now. ASSERT(accumulator == 0); // Don't forget to update the used_digits and the exponent. used_digits_ = product_length; exponent_ *= 2; Clamp(); } void Bignum::AssignPowerUInt16(uint16_t base, int power_exponent) { ASSERT(base != 0); ASSERT(power_exponent >= 0); if (power_exponent == 0) { AssignUInt16(1); return; } Zero(); int shifts = 0; // We expect base to be in range 2-32, and most often to be 10. // It does not make much sense to implement different algorithms for counting // the bits. while ((base & 1) == 0) { base >>= 1; shifts++; } int bit_size = 0; int tmp_base = base; while (tmp_base != 0) { tmp_base >>= 1; bit_size++; } int final_size = bit_size * power_exponent; // 1 extra bigit for the shifting, and one for rounded final_size. EnsureCapacity(final_size / kBigitSize + 2); // Left to Right exponentiation. int mask = 1; while (power_exponent >= mask) mask <<= 1; // The mask is now pointing to the bit above the most significant 1-bit of // power_exponent. // Get rid of first 1-bit; mask >>= 2; uint64_t this_value = base; bool delayed_multipliciation = false; const uint64_t max_32bits = 0xFFFFFFFF; while (mask != 0 && this_value <= max_32bits) { this_value = this_value * this_value; // Verify that there is enough space in this_value to perform the // multiplication. The first bit_size bits must be 0. if ((power_exponent & mask) != 0) { uint64_t base_bits_mask = ~((static_cast(1) << (64 - bit_size)) - 1); bool high_bits_zero = (this_value & base_bits_mask) == 0; if (high_bits_zero) { this_value *= base; } else { delayed_multipliciation = true; } } mask >>= 1; } AssignUInt64(this_value); if (delayed_multipliciation) { MultiplyByUInt32(base); } // Now do the same thing as a bignum. while (mask != 0) { Square(); if ((power_exponent & mask) != 0) { MultiplyByUInt32(base); } mask >>= 1; } // And finally add the saved shifts. ShiftLeft(shifts * power_exponent); } // Precondition: this/other < 16bit. uint16_t Bignum::DivideModuloIntBignum(const Bignum& other) { ASSERT(IsClamped()); ASSERT(other.IsClamped()); ASSERT(other.used_digits_ > 0); // Easy case: if we have less digits than the divisor than the result is 0. // Note: this handles the case where this == 0, too. if (BigitLength() < other.BigitLength()) { return 0; } Align(other); uint16_t result = 0; // Start by removing multiples of 'other' until both numbers have the same // number of digits. 
while (BigitLength() > other.BigitLength()) { // This naive approach is extremely inefficient if the this divided other // might be big. This function is implemented for doubleToString where // the result should be small (less than 10). ASSERT(other.bigits_[other.used_digits_ - 1] >= ((1 << kBigitSize) / 16)); // Remove the multiples of the first digit. // Example this = 23 and other equals 9. -> Remove 2 multiples. result += bigits_[used_digits_ - 1]; SubtractTimes(other, bigits_[used_digits_ - 1]); } ASSERT(BigitLength() == other.BigitLength()); // Both bignums are at the same length now. // Since other has more than 0 digits we know that the access to // bigits_[used_digits_ - 1] is safe. Chunk this_bigit = bigits_[used_digits_ - 1]; Chunk other_bigit = other.bigits_[other.used_digits_ - 1]; if (other.used_digits_ == 1) { // Shortcut for easy (and common) case. int quotient = this_bigit / other_bigit; bigits_[used_digits_ - 1] = this_bigit - other_bigit * quotient; result += quotient; Clamp(); return result; } int division_estimate = this_bigit / (other_bigit + 1); result += division_estimate; SubtractTimes(other, division_estimate); if (other_bigit * (division_estimate + 1) > this_bigit) { // No need to even try to subtract. Even if other's remaining digits were 0 // another subtraction would be too much. return result; } while (LessEqual(other, *this)) { SubtractBignum(other); result++; } return result; } template static int SizeInHexChars(S number) { ASSERT(number > 0); int result = 0; while (number != 0) { number >>= 4; result++; } return result; } static char HexCharOfValue(int value) { ASSERT(0 <= value && value <= 16); if (value < 10) return value + '0'; return value - 10 + 'A'; } bool Bignum::ToHexString(char* buffer, int buffer_size) const { ASSERT(IsClamped()); // Each bigit must be printable as separate hex-character. ASSERT(kBigitSize % 4 == 0); const int kHexCharsPerBigit = kBigitSize / 4; if (used_digits_ == 0) { if (buffer_size < 2) return false; buffer[0] = '0'; buffer[1] = '\0'; return true; } // We add 1 for the terminating '\0' character. int needed_chars = (BigitLength() - 1) * kHexCharsPerBigit + SizeInHexChars(bigits_[used_digits_ - 1]) + 1; if (needed_chars > buffer_size) return false; int string_index = needed_chars - 1; buffer[string_index--] = '\0'; for (int i = 0; i < exponent_; ++i) { for (int j = 0; j < kHexCharsPerBigit; ++j) { buffer[string_index--] = '0'; } } for (int i = 0; i < used_digits_ - 1; ++i) { Chunk current_bigit = bigits_[i]; for (int j = 0; j < kHexCharsPerBigit; ++j) { buffer[string_index--] = HexCharOfValue(current_bigit & 0xF); current_bigit >>= 4; } } // And finally the last bigit. 
Chunk most_significant_bigit = bigits_[used_digits_ - 1]; while (most_significant_bigit != 0) { buffer[string_index--] = HexCharOfValue(most_significant_bigit & 0xF); most_significant_bigit >>= 4; } return true; } Bignum::Chunk Bignum::BigitAt(int index) const { if (index >= BigitLength()) return 0; if (index < exponent_) return 0; return bigits_[index - exponent_]; } int Bignum::Compare(const Bignum& a, const Bignum& b) { ASSERT(a.IsClamped()); ASSERT(b.IsClamped()); int bigit_length_a = a.BigitLength(); int bigit_length_b = b.BigitLength(); if (bigit_length_a < bigit_length_b) return -1; if (bigit_length_a > bigit_length_b) return +1; for (int i = bigit_length_a - 1; i >= Min(a.exponent_, b.exponent_); --i) { Chunk bigit_a = a.BigitAt(i); Chunk bigit_b = b.BigitAt(i); if (bigit_a < bigit_b) return -1; if (bigit_a > bigit_b) return +1; // Otherwise they are equal up to this digit. Try the next digit. } return 0; } int Bignum::PlusCompare(const Bignum& a, const Bignum& b, const Bignum& c) { ASSERT(a.IsClamped()); ASSERT(b.IsClamped()); ASSERT(c.IsClamped()); if (a.BigitLength() < b.BigitLength()) { return PlusCompare(b, a, c); } if (a.BigitLength() + 1 < c.BigitLength()) return -1; if (a.BigitLength() > c.BigitLength()) return +1; // The exponent encodes 0-bigits. So if there are more 0-digits in 'a' than // 'b' has digits, then the bigit-length of 'a'+'b' must be equal to the one // of 'a'. if (a.exponent_ >= b.BigitLength() && a.BigitLength() < c.BigitLength()) { return -1; } Chunk borrow = 0; // Starting at min_exponent all digits are == 0. So no need to compare them. int min_exponent = Min(Min(a.exponent_, b.exponent_), c.exponent_); for (int i = c.BigitLength() - 1; i >= min_exponent; --i) { Chunk chunk_a = a.BigitAt(i); Chunk chunk_b = b.BigitAt(i); Chunk chunk_c = c.BigitAt(i); Chunk sum = chunk_a + chunk_b; if (sum > chunk_c + borrow) { return +1; } else { borrow = chunk_c + borrow - sum; if (borrow > 1) return -1; borrow <<= kBigitSize; } } if (borrow == 0) return 0; return -1; } void Bignum::Clamp() { while (used_digits_ > 0 && bigits_[used_digits_ - 1] == 0) { used_digits_--; } if (used_digits_ == 0) { // Zero. exponent_ = 0; } } bool Bignum::IsClamped() const { return used_digits_ == 0 || bigits_[used_digits_ - 1] != 0; } void Bignum::Zero() { for (int i = 0; i < used_digits_; ++i) { bigits_[i] = 0; } used_digits_ = 0; exponent_ = 0; } void Bignum::Align(const Bignum& other) { if (exponent_ > other.exponent_) { // If "X" represents a "hidden" digit (by the exponent) then we are in the // following case (a == this, b == other): // a: aaaaaaXXXX or a: aaaaaXXX // b: bbbbbbX b: bbbbbbbbXX // We replace some of the hidden digits (X) of a with 0 digits. 
// a: aaaaaa000X or a: aaaaa0XX int zero_digits = exponent_ - other.exponent_; EnsureCapacity(used_digits_ + zero_digits); for (int i = used_digits_ - 1; i >= 0; --i) { bigits_[i + zero_digits] = bigits_[i]; } for (int i = 0; i < zero_digits; ++i) { bigits_[i] = 0; } used_digits_ += zero_digits; exponent_ -= zero_digits; ASSERT(used_digits_ >= 0); ASSERT(exponent_ >= 0); } } void Bignum::BigitsShiftLeft(int shift_amount) { ASSERT(shift_amount < kBigitSize); ASSERT(shift_amount >= 0); Chunk carry = 0; for (int i = 0; i < used_digits_; ++i) { Chunk new_carry = bigits_[i] >> (kBigitSize - shift_amount); bigits_[i] = ((bigits_[i] << shift_amount) + carry) & kBigitMask; carry = new_carry; } if (carry != 0) { bigits_[used_digits_] = carry; used_digits_++; } } void Bignum::SubtractTimes(const Bignum& other, int factor) { ASSERT(exponent_ <= other.exponent_); if (factor < 3) { for (int i = 0; i < factor; ++i) { SubtractBignum(other); } return; } Chunk borrow = 0; int exponent_diff = other.exponent_ - exponent_; for (int i = 0; i < other.used_digits_; ++i) { DoubleChunk product = static_cast(factor) * other.bigits_[i]; DoubleChunk remove = borrow + product; Chunk difference = bigits_[i + exponent_diff] - (remove & kBigitMask); bigits_[i + exponent_diff] = difference & kBigitMask; borrow = static_cast((difference >> (kChunkSize - 1)) + (remove >> kBigitSize)); } for (int i = other.used_digits_ + exponent_diff; i < used_digits_; ++i) { if (borrow == 0) return; Chunk difference = bigits_[i] - borrow; bigits_[i] = difference & kBigitMask; borrow = difference >> (kChunkSize - 1); ++i; } Clamp(); } } // namespace double_conversion ================================================ FILE: src/kenlm/util/double-conversion/bignum.h ================================================ // Copyright 2010 the V8 project authors. All rights reserved. // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following // disclaimer in the documentation and/or other materials provided // with the distribution. // * Neither the name of Google Inc. nor the names of its // contributors may be used to endorse or promote products derived // from this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #ifndef DOUBLE_CONVERSION_BIGNUM_H_ #define DOUBLE_CONVERSION_BIGNUM_H_ #include "utils.h" namespace double_conversion { class Bignum { public: // 3584 = 128 * 28. We can represent 2^3584 > 10^1000 accurately. 
// This bignum can encode much bigger numbers, since it contains an // exponent. static const int kMaxSignificantBits = 3584; Bignum(); void AssignUInt16(uint16_t value); void AssignUInt64(uint64_t value); void AssignBignum(const Bignum& other); void AssignDecimalString(Vector<const char> value); void AssignHexString(Vector<const char> value); void AssignPowerUInt16(uint16_t base, int exponent); void AddUInt16(uint16_t operand); void AddUInt64(uint64_t operand); void AddBignum(const Bignum& other); // Precondition: this >= other. void SubtractBignum(const Bignum& other); void Square(); void ShiftLeft(int shift_amount); void MultiplyByUInt32(uint32_t factor); void MultiplyByUInt64(uint64_t factor); void MultiplyByPowerOfTen(int exponent); void Times10() { return MultiplyByUInt32(10); } // Pseudocode: // int result = this / other; // this = this % other; // In the worst case this function is in O(this/other). uint16_t DivideModuloIntBignum(const Bignum& other); bool ToHexString(char* buffer, int buffer_size) const; // Returns // -1 if a < b, // 0 if a == b, and // +1 if a > b. static int Compare(const Bignum& a, const Bignum& b); static bool Equal(const Bignum& a, const Bignum& b) { return Compare(a, b) == 0; } static bool LessEqual(const Bignum& a, const Bignum& b) { return Compare(a, b) <= 0; } static bool Less(const Bignum& a, const Bignum& b) { return Compare(a, b) < 0; } // Returns Compare(a + b, c); static int PlusCompare(const Bignum& a, const Bignum& b, const Bignum& c); // Returns a + b == c static bool PlusEqual(const Bignum& a, const Bignum& b, const Bignum& c) { return PlusCompare(a, b, c) == 0; } // Returns a + b <= c static bool PlusLessEqual(const Bignum& a, const Bignum& b, const Bignum& c) { return PlusCompare(a, b, c) <= 0; } // Returns a + b < c static bool PlusLess(const Bignum& a, const Bignum& b, const Bignum& c) { return PlusCompare(a, b, c) < 0; } private: typedef uint32_t Chunk; typedef uint64_t DoubleChunk; static const int kChunkSize = sizeof(Chunk) * 8; static const int kDoubleChunkSize = sizeof(DoubleChunk) * 8; // With bigit size of 28 we lose some bits, but a double still fits easily // into two chunks, and more importantly we can use the Comba multiplication. static const int kBigitSize = 28; static const Chunk kBigitMask = (1 << kBigitSize) - 1; // Every instance allocates kBigitLength chunks on the stack. Bignums cannot // grow. There are no checks if the stack-allocated space is sufficient. static const int kBigitCapacity = kMaxSignificantBits / kBigitSize; void EnsureCapacity(int size) { if (size > kBigitCapacity) { UNREACHABLE(); } } void Align(const Bignum& other); void Clamp(); bool IsClamped() const; void Zero(); // Requires this to have enough capacity (no tests done). // Updates used_digits_ if necessary. // shift_amount must be < kBigitSize. void BigitsShiftLeft(int shift_amount); // BigitLength includes the "hidden" digits encoded in the exponent. int BigitLength() const { return used_digits_ + exponent_; } Chunk BigitAt(int index) const; void SubtractTimes(const Bignum& other, int factor); Chunk bigits_buffer_[kBigitCapacity]; // A vector backed by bigits_buffer_. This way accesses to the array are // checked for out-of-bounds errors. Vector<Chunk> bigits_; int used_digits_; // The Bignum's value equals value(bigits_) * 2^(exponent_ * kBigitSize).
int exponent_; DISALLOW_COPY_AND_ASSIGN(Bignum); }; } // namespace double_conversion #endif // DOUBLE_CONVERSION_BIGNUM_H_ ================================================ FILE: src/kenlm/util/double-conversion/cached-powers.cc ================================================ // Copyright 2006-2008 the V8 project authors. All rights reserved. // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following // disclaimer in the documentation and/or other materials provided // with the distribution. // * Neither the name of Google Inc. nor the names of its // contributors may be used to endorse or promote products derived // from this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
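// A quick worked example of how the cached-powers table below is indexed (an illustrative note; the constants it uses are defined after the table): cached powers are spaced kDecimalExponentDistance = 8 apart in the decimal exponent, starting at kMinDecimalExponent = -348, so GetCachedPowerForDecimalExponent computes
//   index = (requested_exponent + kCachedPowersOffset) / kDecimalExponentDistance;
// For requested_exponent = 20 this gives (20 + 348) / 8 = 46, the entry whose decimal_exponent is 20: 0xad78ebc5ac620000 * 2^3 == 10^20 exactly.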
#include #include #include #include "utils.h" #include "cached-powers.h" namespace double_conversion { struct CachedPower { uint64_t significand; int16_t binary_exponent; int16_t decimal_exponent; }; static const CachedPower kCachedPowers[] = { {UINT64_2PART_C(0xfa8fd5a0, 081c0288), -1220, -348}, {UINT64_2PART_C(0xbaaee17f, a23ebf76), -1193, -340}, {UINT64_2PART_C(0x8b16fb20, 3055ac76), -1166, -332}, {UINT64_2PART_C(0xcf42894a, 5dce35ea), -1140, -324}, {UINT64_2PART_C(0x9a6bb0aa, 55653b2d), -1113, -316}, {UINT64_2PART_C(0xe61acf03, 3d1a45df), -1087, -308}, {UINT64_2PART_C(0xab70fe17, c79ac6ca), -1060, -300}, {UINT64_2PART_C(0xff77b1fc, bebcdc4f), -1034, -292}, {UINT64_2PART_C(0xbe5691ef, 416bd60c), -1007, -284}, {UINT64_2PART_C(0x8dd01fad, 907ffc3c), -980, -276}, {UINT64_2PART_C(0xd3515c28, 31559a83), -954, -268}, {UINT64_2PART_C(0x9d71ac8f, ada6c9b5), -927, -260}, {UINT64_2PART_C(0xea9c2277, 23ee8bcb), -901, -252}, {UINT64_2PART_C(0xaecc4991, 4078536d), -874, -244}, {UINT64_2PART_C(0x823c1279, 5db6ce57), -847, -236}, {UINT64_2PART_C(0xc2109436, 4dfb5637), -821, -228}, {UINT64_2PART_C(0x9096ea6f, 3848984f), -794, -220}, {UINT64_2PART_C(0xd77485cb, 25823ac7), -768, -212}, {UINT64_2PART_C(0xa086cfcd, 97bf97f4), -741, -204}, {UINT64_2PART_C(0xef340a98, 172aace5), -715, -196}, {UINT64_2PART_C(0xb23867fb, 2a35b28e), -688, -188}, {UINT64_2PART_C(0x84c8d4df, d2c63f3b), -661, -180}, {UINT64_2PART_C(0xc5dd4427, 1ad3cdba), -635, -172}, {UINT64_2PART_C(0x936b9fce, bb25c996), -608, -164}, {UINT64_2PART_C(0xdbac6c24, 7d62a584), -582, -156}, {UINT64_2PART_C(0xa3ab6658, 0d5fdaf6), -555, -148}, {UINT64_2PART_C(0xf3e2f893, dec3f126), -529, -140}, {UINT64_2PART_C(0xb5b5ada8, aaff80b8), -502, -132}, {UINT64_2PART_C(0x87625f05, 6c7c4a8b), -475, -124}, {UINT64_2PART_C(0xc9bcff60, 34c13053), -449, -116}, {UINT64_2PART_C(0x964e858c, 91ba2655), -422, -108}, {UINT64_2PART_C(0xdff97724, 70297ebd), -396, -100}, {UINT64_2PART_C(0xa6dfbd9f, b8e5b88f), -369, -92}, {UINT64_2PART_C(0xf8a95fcf, 88747d94), -343, -84}, {UINT64_2PART_C(0xb9447093, 8fa89bcf), -316, -76}, {UINT64_2PART_C(0x8a08f0f8, bf0f156b), -289, -68}, {UINT64_2PART_C(0xcdb02555, 653131b6), -263, -60}, {UINT64_2PART_C(0x993fe2c6, d07b7fac), -236, -52}, {UINT64_2PART_C(0xe45c10c4, 2a2b3b06), -210, -44}, {UINT64_2PART_C(0xaa242499, 697392d3), -183, -36}, {UINT64_2PART_C(0xfd87b5f2, 8300ca0e), -157, -28}, {UINT64_2PART_C(0xbce50864, 92111aeb), -130, -20}, {UINT64_2PART_C(0x8cbccc09, 6f5088cc), -103, -12}, {UINT64_2PART_C(0xd1b71758, e219652c), -77, -4}, {UINT64_2PART_C(0x9c400000, 00000000), -50, 4}, {UINT64_2PART_C(0xe8d4a510, 00000000), -24, 12}, {UINT64_2PART_C(0xad78ebc5, ac620000), 3, 20}, {UINT64_2PART_C(0x813f3978, f8940984), 30, 28}, {UINT64_2PART_C(0xc097ce7b, c90715b3), 56, 36}, {UINT64_2PART_C(0x8f7e32ce, 7bea5c70), 83, 44}, {UINT64_2PART_C(0xd5d238a4, abe98068), 109, 52}, {UINT64_2PART_C(0x9f4f2726, 179a2245), 136, 60}, {UINT64_2PART_C(0xed63a231, d4c4fb27), 162, 68}, {UINT64_2PART_C(0xb0de6538, 8cc8ada8), 189, 76}, {UINT64_2PART_C(0x83c7088e, 1aab65db), 216, 84}, {UINT64_2PART_C(0xc45d1df9, 42711d9a), 242, 92}, {UINT64_2PART_C(0x924d692c, a61be758), 269, 100}, {UINT64_2PART_C(0xda01ee64, 1a708dea), 295, 108}, {UINT64_2PART_C(0xa26da399, 9aef774a), 322, 116}, {UINT64_2PART_C(0xf209787b, b47d6b85), 348, 124}, {UINT64_2PART_C(0xb454e4a1, 79dd1877), 375, 132}, {UINT64_2PART_C(0x865b8692, 5b9bc5c2), 402, 140}, {UINT64_2PART_C(0xc83553c5, c8965d3d), 428, 148}, {UINT64_2PART_C(0x952ab45c, fa97a0b3), 455, 156}, {UINT64_2PART_C(0xde469fbd, 99a05fe3), 481, 
164}, {UINT64_2PART_C(0xa59bc234, db398c25), 508, 172}, {UINT64_2PART_C(0xf6c69a72, a3989f5c), 534, 180}, {UINT64_2PART_C(0xb7dcbf53, 54e9bece), 561, 188}, {UINT64_2PART_C(0x88fcf317, f22241e2), 588, 196}, {UINT64_2PART_C(0xcc20ce9b, d35c78a5), 614, 204}, {UINT64_2PART_C(0x98165af3, 7b2153df), 641, 212}, {UINT64_2PART_C(0xe2a0b5dc, 971f303a), 667, 220}, {UINT64_2PART_C(0xa8d9d153, 5ce3b396), 694, 228}, {UINT64_2PART_C(0xfb9b7cd9, a4a7443c), 720, 236}, {UINT64_2PART_C(0xbb764c4c, a7a44410), 747, 244}, {UINT64_2PART_C(0x8bab8eef, b6409c1a), 774, 252}, {UINT64_2PART_C(0xd01fef10, a657842c), 800, 260}, {UINT64_2PART_C(0x9b10a4e5, e9913129), 827, 268}, {UINT64_2PART_C(0xe7109bfb, a19c0c9d), 853, 276}, {UINT64_2PART_C(0xac2820d9, 623bf429), 880, 284}, {UINT64_2PART_C(0x80444b5e, 7aa7cf85), 907, 292}, {UINT64_2PART_C(0xbf21e440, 03acdd2d), 933, 300}, {UINT64_2PART_C(0x8e679c2f, 5e44ff8f), 960, 308}, {UINT64_2PART_C(0xd433179d, 9c8cb841), 986, 316}, {UINT64_2PART_C(0x9e19db92, b4e31ba9), 1013, 324}, {UINT64_2PART_C(0xeb96bf6e, badf77d9), 1039, 332}, {UINT64_2PART_C(0xaf87023b, 9bf0ee6b), 1066, 340}, }; static const int kCachedPowersLength = ARRAY_SIZE(kCachedPowers); static const int kCachedPowersOffset = 348; // -1 * the first decimal_exponent. static const double kD_1_LOG2_10 = 0.30102999566398114; // 1 / lg(10) // Difference between the decimal exponents in the table above. const int PowersOfTenCache::kDecimalExponentDistance = 8; const int PowersOfTenCache::kMinDecimalExponent = -348; const int PowersOfTenCache::kMaxDecimalExponent = 340; void PowersOfTenCache::GetCachedPowerForBinaryExponentRange( int min_exponent, int max_exponent, DiyFp* power, int* decimal_exponent) { int kQ = DiyFp::kSignificandSize; double k = ceil((min_exponent + kQ - 1) * kD_1_LOG2_10); int foo = kCachedPowersOffset; int index = (foo + static_cast(k) - 1) / kDecimalExponentDistance + 1; ASSERT(0 <= index && index < kCachedPowersLength); CachedPower cached_power = kCachedPowers[index]; ASSERT(min_exponent <= cached_power.binary_exponent); ASSERT(cached_power.binary_exponent <= max_exponent); *decimal_exponent = cached_power.decimal_exponent; *power = DiyFp(cached_power.significand, cached_power.binary_exponent); } void PowersOfTenCache::GetCachedPowerForDecimalExponent(int requested_exponent, DiyFp* power, int* found_exponent) { ASSERT(kMinDecimalExponent <= requested_exponent); ASSERT(requested_exponent < kMaxDecimalExponent + kDecimalExponentDistance); int index = (requested_exponent + kCachedPowersOffset) / kDecimalExponentDistance; CachedPower cached_power = kCachedPowers[index]; *power = DiyFp(cached_power.significand, cached_power.binary_exponent); *found_exponent = cached_power.decimal_exponent; ASSERT(*found_exponent <= requested_exponent); ASSERT(requested_exponent < *found_exponent + kDecimalExponentDistance); } } // namespace double_conversion ================================================ FILE: src/kenlm/util/double-conversion/cached-powers.h ================================================ // Copyright 2010 the V8 project authors. All rights reserved. // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. 
// * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following // disclaimer in the documentation and/or other materials provided // with the distribution. // * Neither the name of Google Inc. nor the names of its // contributors may be used to endorse or promote products derived // from this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #ifndef DOUBLE_CONVERSION_CACHED_POWERS_H_ #define DOUBLE_CONVERSION_CACHED_POWERS_H_ #include "diy-fp.h" namespace double_conversion { class PowersOfTenCache { public: // Not all powers of ten are cached. The decimal exponent of two neighboring // cached numbers will differ by kDecimalExponentDistance. static const int kDecimalExponentDistance; static const int kMinDecimalExponent; static const int kMaxDecimalExponent; // Returns a cached power-of-ten with a binary exponent in the range // [min_exponent; max_exponent] (boundaries included). static void GetCachedPowerForBinaryExponentRange(int min_exponent, int max_exponent, DiyFp* power, int* decimal_exponent); // Returns a cached power of ten x ~= 10^k such that // k <= decimal_exponent < k + kCachedPowersDecimalDistance. // The given decimal_exponent must satisfy // kMinDecimalExponent <= requested_exponent, and // requested_exponent < kMaxDecimalExponent + kDecimalExponentDistance. static void GetCachedPowerForDecimalExponent(int requested_exponent, DiyFp* power, int* found_exponent); }; } // namespace double_conversion #endif // DOUBLE_CONVERSION_CACHED_POWERS_H_ ================================================ FILE: src/kenlm/util/double-conversion/diy-fp.cc ================================================ // Copyright 2010 the V8 project authors. All rights reserved. // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following // disclaimer in the documentation and/or other materials provided // with the distribution. // * Neither the name of Google Inc. nor the names of its // contributors may be used to endorse or promote products derived // from this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. 
IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #include "diy-fp.h" #include "utils.h" namespace double_conversion { void DiyFp::Multiply(const DiyFp& other) { // Simply "emulates" a 128 bit multiplication. // However: the resulting number only contains 64 bits. The least // significant 64 bits are only used for rounding the most significant 64 // bits. const uint64_t kM32 = 0xFFFFFFFFU; uint64_t a = f_ >> 32; uint64_t b = f_ & kM32; uint64_t c = other.f_ >> 32; uint64_t d = other.f_ & kM32; uint64_t ac = a * c; uint64_t bc = b * c; uint64_t ad = a * d; uint64_t bd = b * d; uint64_t tmp = (bd >> 32) + (ad & kM32) + (bc & kM32); // By adding 1U << 31 to tmp we round the final result. // Halfway cases will be round up. tmp += 1U << 31; uint64_t result_f = ac + (ad >> 32) + (bc >> 32) + (tmp >> 32); e_ += other.e_ + 64; f_ = result_f; } } // namespace double_conversion ================================================ FILE: src/kenlm/util/double-conversion/diy-fp.h ================================================ // Copyright 2010 the V8 project authors. All rights reserved. // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following // disclaimer in the documentation and/or other materials provided // with the distribution. // * Neither the name of Google Inc. nor the names of its // contributors may be used to endorse or promote products derived // from this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #ifndef DOUBLE_CONVERSION_DIY_FP_H_ #define DOUBLE_CONVERSION_DIY_FP_H_ #include "utils.h" namespace double_conversion { // This "Do It Yourself Floating Point" class implements a floating-point number // with a uint64 significand and an int exponent. Normalized DiyFp numbers will // have the most significant bit of the significand set. // Multiplication and Subtraction do not normalize their results. // DiyFp are not designed to contain special doubles (NaN and Infinity). 
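// A concrete illustration of this representation (an illustrative sketch; the values follow from the definitions below): the normalized DiyFp for the double 1.0 stores f = 0x8000000000000000 (that is, 1 << 63) and e = -63, so that 1.0 == f * 2^e with the most significant bit of the significand set.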
class DiyFp { public: static const int kSignificandSize = 64; DiyFp() : f_(0), e_(0) {} DiyFp(uint64_t f, int e) : f_(f), e_(e) {} // this = this - other. // The exponents of both numbers must be the same and the significand of this // must be bigger than the significand of other. // The result will not be normalized. void Subtract(const DiyFp& other) { ASSERT(e_ == other.e_); ASSERT(f_ >= other.f_); f_ -= other.f_; } // Returns a - b. // The exponents of both numbers must be the same and this must be bigger // than other. The result will not be normalized. static DiyFp Minus(const DiyFp& a, const DiyFp& b) { DiyFp result = a; result.Subtract(b); return result; } // this = this * other. void Multiply(const DiyFp& other); // returns a * b; static DiyFp Times(const DiyFp& a, const DiyFp& b) { DiyFp result = a; result.Multiply(b); return result; } void Normalize() { ASSERT(f_ != 0); uint64_t f = f_; int e = e_; // This method is mainly called for normalizing boundaries. In general // boundaries need to be shifted by 10 bits. We thus optimize for this case. const uint64_t k10MSBits = UINT64_2PART_C(0xFFC00000, 00000000); while ((f & k10MSBits) == 0) { f <<= 10; e -= 10; } while ((f & kUint64MSB) == 0) { f <<= 1; e--; } f_ = f; e_ = e; } static DiyFp Normalize(const DiyFp& a) { DiyFp result = a; result.Normalize(); return result; } uint64_t f() const { return f_; } int e() const { return e_; } void set_f(uint64_t new_value) { f_ = new_value; } void set_e(int new_value) { e_ = new_value; } private: static const uint64_t kUint64MSB = UINT64_2PART_C(0x80000000, 00000000); uint64_t f_; int e_; }; } // namespace double_conversion #endif // DOUBLE_CONVERSION_DIY_FP_H_ ================================================ FILE: src/kenlm/util/double-conversion/double-conversion.cc ================================================ // Copyright 2010 the V8 project authors. All rights reserved. // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following // disclaimer in the documentation and/or other materials provided // with the distribution. // * Neither the name of Google Inc. nor the names of its // contributors may be used to endorse or promote products derived // from this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
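// Minimal usage sketch for the converter implemented in this file (assumes the StringBuilder helper declared in utils.h; the buffer size here is only illustrative):
//   char buf[64];
//   StringBuilder builder(buf, sizeof(buf));
//   DoubleToStringConverter::EcmaScriptConverter().ToShortest(0.1, &builder);
//   // builder.Finalize() then yields the null-terminated string "0.1".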
#include #include #include "double-conversion.h" #include "bignum-dtoa.h" #include "fast-dtoa.h" #include "fixed-dtoa.h" #include "ieee.h" #include "strtod.h" #include "utils.h" namespace double_conversion { const DoubleToStringConverter& DoubleToStringConverter::EcmaScriptConverter() { int flags = UNIQUE_ZERO | EMIT_POSITIVE_EXPONENT_SIGN; static DoubleToStringConverter converter(flags, "Infinity", "NaN", 'e', -6, 21, 6, 0); return converter; } bool DoubleToStringConverter::HandleSpecialValues( double value, StringBuilder* result_builder) const { Double double_inspect(value); if (double_inspect.IsInfinite()) { if (infinity_symbol_ == NULL) return false; if (value < 0) { result_builder->AddCharacter('-'); } result_builder->AddString(infinity_symbol_); return true; } if (double_inspect.IsNan()) { if (nan_symbol_ == NULL) return false; result_builder->AddString(nan_symbol_); return true; } return false; } void DoubleToStringConverter::CreateExponentialRepresentation( const char* decimal_digits, int length, int exponent, StringBuilder* result_builder) const { ASSERT(length != 0); result_builder->AddCharacter(decimal_digits[0]); if (length != 1) { result_builder->AddCharacter('.'); result_builder->AddSubstring(&decimal_digits[1], length-1); } result_builder->AddCharacter(exponent_character_); if (exponent < 0) { result_builder->AddCharacter('-'); exponent = -exponent; } else { if ((flags_ & EMIT_POSITIVE_EXPONENT_SIGN) != 0) { result_builder->AddCharacter('+'); } } if (exponent == 0) { result_builder->AddCharacter('0'); return; } ASSERT(exponent < 1e4); const int kMaxExponentLength = 5; char buffer[kMaxExponentLength + 1]; buffer[kMaxExponentLength] = '\0'; int first_char_pos = kMaxExponentLength; while (exponent > 0) { buffer[--first_char_pos] = '0' + (exponent % 10); exponent /= 10; } result_builder->AddSubstring(&buffer[first_char_pos], kMaxExponentLength - first_char_pos); } void DoubleToStringConverter::CreateDecimalRepresentation( const char* decimal_digits, int length, int decimal_point, int digits_after_point, StringBuilder* result_builder) const { // Create a representation that is padded with zeros if needed. if (decimal_point <= 0) { // "0.00000decimal_rep". 
result_builder->AddCharacter('0'); if (digits_after_point > 0) { result_builder->AddCharacter('.'); result_builder->AddPadding('0', -decimal_point); ASSERT(length <= digits_after_point - (-decimal_point)); result_builder->AddSubstring(decimal_digits, length); int remaining_digits = digits_after_point - (-decimal_point) - length; result_builder->AddPadding('0', remaining_digits); } } else if (decimal_point >= length) { // "decimal_rep0000.00000" or "decimal_rep.0000" result_builder->AddSubstring(decimal_digits, length); result_builder->AddPadding('0', decimal_point - length); if (digits_after_point > 0) { result_builder->AddCharacter('.'); result_builder->AddPadding('0', digits_after_point); } } else { // "decima.l_rep000" ASSERT(digits_after_point > 0); result_builder->AddSubstring(decimal_digits, decimal_point); result_builder->AddCharacter('.'); ASSERT(length - decimal_point <= digits_after_point); result_builder->AddSubstring(&decimal_digits[decimal_point], length - decimal_point); int remaining_digits = digits_after_point - (length - decimal_point); result_builder->AddPadding('0', remaining_digits); } if (digits_after_point == 0) { if ((flags_ & EMIT_TRAILING_DECIMAL_POINT) != 0) { result_builder->AddCharacter('.'); } if ((flags_ & EMIT_TRAILING_ZERO_AFTER_POINT) != 0) { result_builder->AddCharacter('0'); } } } bool DoubleToStringConverter::ToShortestIeeeNumber( double value, StringBuilder* result_builder, DoubleToStringConverter::DtoaMode mode) const { ASSERT(mode == SHORTEST || mode == SHORTEST_SINGLE); if (Double(value).IsSpecial()) { return HandleSpecialValues(value, result_builder); } int decimal_point; bool sign; const int kDecimalRepCapacity = kBase10MaximalLength + 1; char decimal_rep[kDecimalRepCapacity]; int decimal_rep_length; DoubleToAscii(value, mode, 0, decimal_rep, kDecimalRepCapacity, &sign, &decimal_rep_length, &decimal_point); bool unique_zero = (flags_ & UNIQUE_ZERO) != 0; if (sign && (value != 0.0 || !unique_zero)) { result_builder->AddCharacter('-'); } int exponent = decimal_point - 1; if ((decimal_in_shortest_low_ <= exponent) && (exponent < decimal_in_shortest_high_)) { CreateDecimalRepresentation(decimal_rep, decimal_rep_length, decimal_point, Max(0, decimal_rep_length - decimal_point), result_builder); } else { CreateExponentialRepresentation(decimal_rep, decimal_rep_length, exponent, result_builder); } return true; } bool DoubleToStringConverter::ToFixed(double value, int requested_digits, StringBuilder* result_builder) const { ASSERT(kMaxFixedDigitsBeforePoint == 60); const double kFirstNonFixed = 1e60; if (Double(value).IsSpecial()) { return HandleSpecialValues(value, result_builder); } if (requested_digits > kMaxFixedDigitsAfterPoint) return false; if (value >= kFirstNonFixed || value <= -kFirstNonFixed) return false; // Find a sufficiently precise decimal representation of n. int decimal_point; bool sign; // Add space for the '\0' byte. 
const int kDecimalRepCapacity = kMaxFixedDigitsBeforePoint + kMaxFixedDigitsAfterPoint + 1; char decimal_rep[kDecimalRepCapacity]; int decimal_rep_length; DoubleToAscii(value, FIXED, requested_digits, decimal_rep, kDecimalRepCapacity, &sign, &decimal_rep_length, &decimal_point); bool unique_zero = ((flags_ & UNIQUE_ZERO) != 0); if (sign && (value != 0.0 || !unique_zero)) { result_builder->AddCharacter('-'); } CreateDecimalRepresentation(decimal_rep, decimal_rep_length, decimal_point, requested_digits, result_builder); return true; } bool DoubleToStringConverter::ToExponential( double value, int requested_digits, StringBuilder* result_builder) const { if (Double(value).IsSpecial()) { return HandleSpecialValues(value, result_builder); } if (requested_digits < -1) return false; if (requested_digits > kMaxExponentialDigits) return false; int decimal_point; bool sign; // Add space for digit before the decimal point and the '\0' character. const int kDecimalRepCapacity = kMaxExponentialDigits + 2; ASSERT(kDecimalRepCapacity > kBase10MaximalLength); char decimal_rep[kDecimalRepCapacity]; int decimal_rep_length; if (requested_digits == -1) { DoubleToAscii(value, SHORTEST, 0, decimal_rep, kDecimalRepCapacity, &sign, &decimal_rep_length, &decimal_point); } else { DoubleToAscii(value, PRECISION, requested_digits + 1, decimal_rep, kDecimalRepCapacity, &sign, &decimal_rep_length, &decimal_point); ASSERT(decimal_rep_length <= requested_digits + 1); for (int i = decimal_rep_length; i < requested_digits + 1; ++i) { decimal_rep[i] = '0'; } decimal_rep_length = requested_digits + 1; } bool unique_zero = ((flags_ & UNIQUE_ZERO) != 0); if (sign && (value != 0.0 || !unique_zero)) { result_builder->AddCharacter('-'); } int exponent = decimal_point - 1; CreateExponentialRepresentation(decimal_rep, decimal_rep_length, exponent, result_builder); return true; } bool DoubleToStringConverter::ToPrecision(double value, int precision, StringBuilder* result_builder) const { if (Double(value).IsSpecial()) { return HandleSpecialValues(value, result_builder); } if (precision < kMinPrecisionDigits || precision > kMaxPrecisionDigits) { return false; } // Find a sufficiently precise decimal representation of n. int decimal_point; bool sign; // Add one for the terminating null character. const int kDecimalRepCapacity = kMaxPrecisionDigits + 1; char decimal_rep[kDecimalRepCapacity]; int decimal_rep_length; DoubleToAscii(value, PRECISION, precision, decimal_rep, kDecimalRepCapacity, &sign, &decimal_rep_length, &decimal_point); ASSERT(decimal_rep_length <= precision); bool unique_zero = ((flags_ & UNIQUE_ZERO) != 0); if (sign && (value != 0.0 || !unique_zero)) { result_builder->AddCharacter('-'); } // The exponent if we print the number as x.xxeyyy. That is with the // decimal point after the first digit. int exponent = decimal_point - 1; int extra_zero = ((flags_ & EMIT_TRAILING_ZERO_AFTER_POINT) != 0) ? 1 : 0; if ((-decimal_point + 1 > max_leading_padding_zeroes_in_precision_mode_) || (decimal_point - precision + extra_zero > max_trailing_padding_zeroes_in_precision_mode_)) { // Fill buffer to contain 'precision' digits. // Usually the buffer is already at the correct length, but 'DoubleToAscii' // is allowed to return less characters. 
for (int i = decimal_rep_length; i < precision; ++i) { decimal_rep[i] = '0'; } CreateExponentialRepresentation(decimal_rep, precision, exponent, result_builder); } else { CreateDecimalRepresentation(decimal_rep, decimal_rep_length, decimal_point, Max(0, precision - decimal_point), result_builder); } return true; } static BignumDtoaMode DtoaToBignumDtoaMode( DoubleToStringConverter::DtoaMode dtoa_mode) { switch (dtoa_mode) { case DoubleToStringConverter::SHORTEST: return BIGNUM_DTOA_SHORTEST; case DoubleToStringConverter::SHORTEST_SINGLE: return BIGNUM_DTOA_SHORTEST_SINGLE; case DoubleToStringConverter::FIXED: return BIGNUM_DTOA_FIXED; case DoubleToStringConverter::PRECISION: return BIGNUM_DTOA_PRECISION; default: UNREACHABLE(); return BIGNUM_DTOA_SHORTEST; // To silence compiler. } } void DoubleToStringConverter::DoubleToAscii(double v, DtoaMode mode, int requested_digits, char* buffer, int buffer_length, bool* sign, int* length, int* point) { Vector vector(buffer, buffer_length); ASSERT(!Double(v).IsSpecial()); ASSERT(mode == SHORTEST || mode == SHORTEST_SINGLE || requested_digits >= 0); if (Double(v).Sign() < 0) { *sign = true; v = -v; } else { *sign = false; } if (mode == PRECISION && requested_digits == 0) { vector[0] = '\0'; *length = 0; return; } if (v == 0) { vector[0] = '0'; vector[1] = '\0'; *length = 1; *point = 1; return; } bool fast_worked; switch (mode) { case SHORTEST: fast_worked = FastDtoa(v, FAST_DTOA_SHORTEST, 0, vector, length, point); break; case SHORTEST_SINGLE: fast_worked = FastDtoa(v, FAST_DTOA_SHORTEST_SINGLE, 0, vector, length, point); break; case FIXED: fast_worked = FastFixedDtoa(v, requested_digits, vector, length, point); break; case PRECISION: fast_worked = FastDtoa(v, FAST_DTOA_PRECISION, requested_digits, vector, length, point); break; default: UNREACHABLE(); fast_worked = false; } if (fast_worked) return; // If the fast dtoa didn't succeed use the slower bignum version. BignumDtoaMode bignum_mode = DtoaToBignumDtoaMode(mode); BignumDtoa(v, bignum_mode, requested_digits, vector, length, point); vector[*length] = '\0'; } // Consumes the given substring from the iterator. // Returns false, if the substring does not match. static bool ConsumeSubString(const char** current, const char* end, const char* substring) { ASSERT(**current == *substring); for (substring++; *substring != '\0'; substring++) { ++*current; if (*current == end || **current != *substring) return false; } ++*current; return true; } // Maximum number of significant digits in decimal representation. // The longest possible double in decimal representation is // (2^53 - 1) * 2 ^ -1074 that is (2 ^ 53 - 1) * 5 ^ 1074 / 10 ^ 1074 // (768 digits). If we parse a number whose first digits are equal to a // mean of 2 adjacent doubles (that could have up to 769 digits) the result // must be rounded to the bigger one unless the tail consists of zeros, so // we don't need to preserve all the digits. const int kMaxSignificantDigits = 772; // Returns true if a nonspace found and false if the end has reached. static inline bool AdvanceToNonspace(const char** current, const char* end) { while (*current != end) { if (**current != ' ') return true; ++*current; } return false; } static bool isDigit(int x, int radix) { return (x >= '0' && x <= '9' && x < '0' + radix) || (radix > 10 && x >= 'a' && x < 'a' + radix - 10) || (radix > 10 && x >= 'A' && x < 'A' + radix - 10); } static double SignedZero(bool sign) { return sign ? -0.0 : 0.0; } // Parsing integers with radix 2, 4, 8, 16, 32. Assumes current != end. 
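// Illustrative trace of the function below (added example, not exhaustive): parsing the hex digits "ff" with radix_log_2 == 4 accumulates number = 15, then number = 15 * 16 + 15 = 255; this never exceeds the 53-bit significand, so no rounding is needed and the function returns 255.0.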
template <int radix_log_2> static double RadixStringToIeee(const char* current, const char* end, bool sign, bool allow_trailing_junk, double junk_string_value, bool read_as_double, const char** trailing_pointer) { ASSERT(current != end); const int kDoubleSize = Double::kSignificandSize; const int kSingleSize = Single::kSignificandSize; const int kSignificandSize = read_as_double? kDoubleSize: kSingleSize; // Skip leading 0s. while (*current == '0') { ++current; if (current == end) { *trailing_pointer = end; return SignedZero(sign); } } int64_t number = 0; int exponent = 0; const int radix = (1 << radix_log_2); do { int digit; if (*current >= '0' && *current <= '9' && *current < '0' + radix) { digit = static_cast<char>(*current) - '0'; } else if (radix > 10 && *current >= 'a' && *current < 'a' + radix - 10) { digit = static_cast<char>(*current) - 'a' + 10; } else if (radix > 10 && *current >= 'A' && *current < 'A' + radix - 10) { digit = static_cast<char>(*current) - 'A' + 10; } else { if (allow_trailing_junk || !AdvanceToNonspace(&current, end)) { break; } else { return junk_string_value; } } number = number * radix + digit; int overflow = static_cast<int>(number >> kSignificandSize); if (overflow != 0) { // Overflow occurred. Need to determine which direction to round the // result. int overflow_bits_count = 1; while (overflow > 1) { overflow_bits_count++; overflow >>= 1; } int dropped_bits_mask = ((1 << overflow_bits_count) - 1); int dropped_bits = static_cast<int>(number) & dropped_bits_mask; number >>= overflow_bits_count; exponent = overflow_bits_count; bool zero_tail = true; while (true) { ++current; if (current == end || !isDigit(*current, radix)) break; zero_tail = zero_tail && *current == '0'; exponent += radix_log_2; } if (!allow_trailing_junk && AdvanceToNonspace(&current, end)) { return junk_string_value; } int middle_value = (1 << (overflow_bits_count - 1)); if (dropped_bits > middle_value) { number++; // Rounding up. } else if (dropped_bits == middle_value) { // Rounding to even for consistency with decimals: half-way case rounds // up if significant part is odd and down otherwise. if ((number & 1) != 0 || !zero_tail) { number++; // Rounding up. } } // Rounding up may cause overflow. if ((number & ((int64_t)1 << kSignificandSize)) != 0) { exponent++; number >>= 1; } break; } ++current; } while (current != end); ASSERT(number < ((int64_t)1 << kSignificandSize)); ASSERT(static_cast<int64_t>(static_cast<double>(number)) == number); *trailing_pointer = current; if (exponent == 0) { if (sign) { if (number == 0) return -0.0; number = -number; } return static_cast<double>(number); } ASSERT(number != 0); return Double(DiyFp(number, exponent)).value(); } double StringToDoubleConverter::StringToIeee( const char* input, int length, int* processed_characters_count, bool read_as_double) const { const char* current = input; const char* end = input + length; *processed_characters_count = 0; const bool allow_trailing_junk = (flags_ & ALLOW_TRAILING_JUNK) != 0; const bool allow_leading_spaces = (flags_ & ALLOW_LEADING_SPACES) != 0; const bool allow_trailing_spaces = (flags_ & ALLOW_TRAILING_SPACES) != 0; const bool allow_spaces_after_sign = (flags_ & ALLOW_SPACES_AFTER_SIGN) != 0; // To make sure that iterator dereferencing is valid the following // convention is used: // 1. Each '++current' statement is followed by check for equality to 'end'. // 2. If AdvanceToNonspace returned false then current == end. // 3. If 'current' becomes equal to 'end' the function returns or goes to // 'parsing_done'. // 4. 'current' is not dereferenced after the 'parsing_done' label. // 5.
Code before 'parsing_done' may rely on 'current != end'. if (current == end) return empty_string_value_; if (allow_leading_spaces || allow_trailing_spaces) { if (!AdvanceToNonspace(&current, end)) { *processed_characters_count = current - input; return empty_string_value_; } if (!allow_leading_spaces && (input != current)) { // No leading spaces allowed, but AdvanceToNonspace moved forward. return junk_string_value_; } } // The longest form of simplified number is: "-.1eXXX\0". const int kBufferSize = kMaxSignificantDigits + 10; char buffer[kBufferSize]; // NOLINT: size is known at compile time. int buffer_pos = 0; // Exponent will be adjusted if insignificant digits of the integer part // or insignificant leading zeros of the fractional part are dropped. int exponent = 0; int significant_digits = 0; int insignificant_digits = 0; bool nonzero_digit_dropped = false; bool sign = false; if (*current == '+' || *current == '-') { sign = (*current == '-'); ++current; const char* next_non_space = current; // Skip following spaces (if allowed). if (!AdvanceToNonspace(&next_non_space, end)) return junk_string_value_; if (!allow_spaces_after_sign && (current != next_non_space)) { return junk_string_value_; } current = next_non_space; } if (infinity_symbol_ != NULL) { if (*current == infinity_symbol_[0]) { if (!ConsumeSubString(&current, end, infinity_symbol_)) { return junk_string_value_; } if (!(allow_trailing_spaces || allow_trailing_junk) && (current != end)) { return junk_string_value_; } if (!allow_trailing_junk && AdvanceToNonspace(&current, end)) { return junk_string_value_; } ASSERT(buffer_pos == 0); *processed_characters_count = current - input; return sign ? -Double::Infinity() : Double::Infinity(); } } if (nan_symbol_ != NULL) { if (*current == nan_symbol_[0]) { if (!ConsumeSubString(&current, end, nan_symbol_)) { return junk_string_value_; } if (!(allow_trailing_spaces || allow_trailing_junk) && (current != end)) { return junk_string_value_; } if (!allow_trailing_junk && AdvanceToNonspace(&current, end)) { return junk_string_value_; } ASSERT(buffer_pos == 0); *processed_characters_count = current - input; return sign ? -Double::NaN() : Double::NaN(); } } bool leading_zero = false; if (*current == '0') { ++current; if (current == end) { *processed_characters_count = current - input; return SignedZero(sign); } leading_zero = true; // It could be hexadecimal value. if ((flags_ & ALLOW_HEX) && (*current == 'x' || *current == 'X')) { ++current; if (current == end || !isDigit(*current, 16)) { return junk_string_value_; // "0x". } const char* tail_pointer = NULL; double result = RadixStringToIeee<4>(current, end, sign, allow_trailing_junk, junk_string_value_, read_as_double, &tail_pointer); if (tail_pointer != NULL) { if (allow_trailing_spaces) AdvanceToNonspace(&tail_pointer, end); *processed_characters_count = tail_pointer - input; } return result; } // Ignore leading zeros in the integer part. while (*current == '0') { ++current; if (current == end) { *processed_characters_count = current - input; return SignedZero(sign); } } } bool octal = leading_zero && (flags_ & ALLOW_OCTALS) != 0; // Copy significant digits of the integer part (if any) to the buffer. while (*current >= '0' && *current <= '9') { if (significant_digits < kMaxSignificantDigits) { ASSERT(buffer_pos < kBufferSize); buffer[buffer_pos++] = static_cast<char>(*current); significant_digits++; // Will later check if it's an octal in the buffer. } else { insignificant_digits++; // Move the digit into the exponential part.
nonzero_digit_dropped = nonzero_digit_dropped || *current != '0'; } octal = octal && *current < '8'; ++current; if (current == end) goto parsing_done; } if (significant_digits == 0) { octal = false; } if (*current == '.') { if (octal && !allow_trailing_junk) return junk_string_value_; if (octal) goto parsing_done; ++current; if (current == end) { if (significant_digits == 0 && !leading_zero) { return junk_string_value_; } else { goto parsing_done; } } if (significant_digits == 0) { // octal = false; // Integer part consists of 0 or is absent. Significant digits start after // leading zeros (if any). while (*current == '0') { ++current; if (current == end) { *processed_characters_count = current - input; return SignedZero(sign); } exponent--; // Move this 0 into the exponent. } } // There is a fractional part. // We don't emit a '.', but adjust the exponent instead. while (*current >= '0' && *current <= '9') { if (significant_digits < kMaxSignificantDigits) { ASSERT(buffer_pos < kBufferSize); buffer[buffer_pos++] = static_cast<char>(*current); significant_digits++; exponent--; } else { // Ignore insignificant digits in the fractional part. nonzero_digit_dropped = nonzero_digit_dropped || *current != '0'; } ++current; if (current == end) goto parsing_done; } } if (!leading_zero && exponent == 0 && significant_digits == 0) { // If leading_zeros is true then the string contains zeros. // If exponent < 0 then string was [+-]\.0*... // If significant_digits != 0 the string is not equal to 0. // Otherwise there are no digits in the string. return junk_string_value_; } // Parse exponential part. if (*current == 'e' || *current == 'E') { if (octal && !allow_trailing_junk) return junk_string_value_; if (octal) goto parsing_done; ++current; if (current == end) { if (allow_trailing_junk) { goto parsing_done; } else { return junk_string_value_; } } char sign = '+'; if (*current == '+' || *current == '-') { sign = static_cast<char>(*current); ++current; if (current == end) { if (allow_trailing_junk) { goto parsing_done; } else { return junk_string_value_; } } } if (current == end || *current < '0' || *current > '9') { if (allow_trailing_junk) { goto parsing_done; } else { return junk_string_value_; } } const int max_exponent = INT_MAX / 2; ASSERT(-max_exponent / 2 <= exponent && exponent <= max_exponent / 2); int num = 0; do { // Check overflow. int digit = *current - '0'; if (num >= max_exponent / 10 && !(num == max_exponent / 10 && digit <= max_exponent % 10)) { num = max_exponent; } else { num = num * 10 + digit; } ++current; } while (current != end && *current >= '0' && *current <= '9'); exponent += (sign == '-' ?
-num : num); } if (!(allow_trailing_spaces || allow_trailing_junk) && (current != end)) { return junk_string_value_; } if (!allow_trailing_junk && AdvanceToNonspace(&current, end)) { return junk_string_value_; } if (allow_trailing_spaces) { AdvanceToNonspace(&current, end); } parsing_done: exponent += insignificant_digits; if (octal) { double result; const char* tail_pointer = NULL; result = RadixStringToIeee<3>(buffer, buffer + buffer_pos, sign, allow_trailing_junk, junk_string_value_, read_as_double, &tail_pointer); ASSERT(tail_pointer != NULL); *processed_characters_count = current - input; return result; } if (nonzero_digit_dropped) { buffer[buffer_pos++] = '1'; exponent--; } ASSERT(buffer_pos < kBufferSize); buffer[buffer_pos] = '\0'; double converted; if (read_as_double) { converted = Strtod(Vector<const char>(buffer, buffer_pos), exponent); } else { converted = Strtof(Vector<const char>(buffer, buffer_pos), exponent); } *processed_characters_count = current - input; return sign? -converted: converted; } } // namespace double_conversion ================================================ FILE: src/kenlm/util/double-conversion/double-conversion.h ================================================ // Copyright 2012 the V8 project authors. All rights reserved. // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following // disclaimer in the documentation and/or other materials provided // with the distribution. // * Neither the name of Google Inc. nor the names of its // contributors may be used to endorse or promote products derived // from this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #ifndef DOUBLE_CONVERSION_DOUBLE_CONVERSION_H_ #define DOUBLE_CONVERSION_DOUBLE_CONVERSION_H_ #include "utils.h" namespace double_conversion { class DoubleToStringConverter { public: // When calling ToFixed with a double > 10^kMaxFixedDigitsBeforePoint // or a requested_digits parameter > kMaxFixedDigitsAfterPoint then the // function returns false. static const int kMaxFixedDigitsBeforePoint = 60; static const int kMaxFixedDigitsAfterPoint = 60; // When calling ToExponential with a requested_digits // parameter > kMaxExponentialDigits then the function returns false. static const int kMaxExponentialDigits = 120; // When calling ToPrecision with a requested_digits // parameter < kMinPrecisionDigits or requested_digits > kMaxPrecisionDigits // then the function returns false.
static const int kMinPrecisionDigits = 1; static const int kMaxPrecisionDigits = 120; enum Flags { NO_FLAGS = 0, EMIT_POSITIVE_EXPONENT_SIGN = 1, EMIT_TRAILING_DECIMAL_POINT = 2, EMIT_TRAILING_ZERO_AFTER_POINT = 4, UNIQUE_ZERO = 8 }; // Flags should be a bit-or combination of the possible Flags-enum. // - NO_FLAGS: no special flags. // - EMIT_POSITIVE_EXPONENT_SIGN: when the number is converted into exponent // form, emits a '+' for positive exponents. Example: 1.2e+2. // - EMIT_TRAILING_DECIMAL_POINT: when the input number is an integer and is // converted into decimal format then a trailing decimal point is appended. // Example: 2345.0 is converted to "2345.". // - EMIT_TRAILING_ZERO_AFTER_POINT: in addition to a trailing decimal point // emits a trailing '0'-character. This flag requires the // EXMIT_TRAILING_DECIMAL_POINT flag. // Example: 2345.0 is converted to "2345.0". // - UNIQUE_ZERO: "-0.0" is converted to "0.0". // // Infinity symbol and nan_symbol provide the string representation for these // special values. If the string is NULL and the special value is encountered // then the conversion functions return false. // // The exponent_character is used in exponential representations. It is // usually 'e' or 'E'. // // When converting to the shortest representation the converter will // represent input numbers in decimal format if they are in the interval // [10^decimal_in_shortest_low; 10^decimal_in_shortest_high[ // (lower boundary included, greater boundary excluded). // Example: with decimal_in_shortest_low = -6 and // decimal_in_shortest_high = 21: // ToShortest(0.000001) -> "0.000001" // ToShortest(0.0000001) -> "1e-7" // ToShortest(111111111111111111111.0) -> "111111111111111110000" // ToShortest(100000000000000000000.0) -> "100000000000000000000" // ToShortest(1111111111111111111111.0) -> "1.1111111111111111e+21" // // When converting to precision mode the converter may add // max_leading_padding_zeroes before returning the number in exponential // format. // Example with max_leading_padding_zeroes_in_precision_mode = 6. // ToPrecision(0.0000012345, 2) -> "0.0000012" // ToPrecision(0.00000012345, 2) -> "1.2e-7" // Similarily the converter may add up to // max_trailing_padding_zeroes_in_precision_mode in precision mode to avoid // returning an exponential representation. A zero added by the // EMIT_TRAILING_ZERO_AFTER_POINT flag is counted for this limit. // Examples for max_trailing_padding_zeroes_in_precision_mode = 1: // ToPrecision(230.0, 2) -> "230" // ToPrecision(230.0, 2) -> "230." with EMIT_TRAILING_DECIMAL_POINT. // ToPrecision(230.0, 2) -> "2.3e2" with EMIT_TRAILING_ZERO_AFTER_POINT. DoubleToStringConverter(int flags, const char* infinity_symbol, const char* nan_symbol, char exponent_character, int decimal_in_shortest_low, int decimal_in_shortest_high, int max_leading_padding_zeroes_in_precision_mode, int max_trailing_padding_zeroes_in_precision_mode) : flags_(flags), infinity_symbol_(infinity_symbol), nan_symbol_(nan_symbol), exponent_character_(exponent_character), decimal_in_shortest_low_(decimal_in_shortest_low), decimal_in_shortest_high_(decimal_in_shortest_high), max_leading_padding_zeroes_in_precision_mode_( max_leading_padding_zeroes_in_precision_mode), max_trailing_padding_zeroes_in_precision_mode_( max_trailing_padding_zeroes_in_precision_mode) { // When 'trailing zero after the point' is set, then 'trailing point' // must be set too. 
ASSERT(((flags & EMIT_TRAILING_DECIMAL_POINT) != 0) || !((flags & EMIT_TRAILING_ZERO_AFTER_POINT) != 0)); } // Returns a converter following the EcmaScript specification. static const DoubleToStringConverter& EcmaScriptConverter(); // Computes the shortest string of digits that correctly represent the input // number. Depending on decimal_in_shortest_low and decimal_in_shortest_high // (see constructor) it then either returns a decimal representation, or an // exponential representation. // Example with decimal_in_shortest_low = -6, // decimal_in_shortest_high = 21, // EMIT_POSITIVE_EXPONENT_SIGN activated, and // EMIT_TRAILING_DECIMAL_POINT deactived: // ToShortest(0.000001) -> "0.000001" // ToShortest(0.0000001) -> "1e-7" // ToShortest(111111111111111111111.0) -> "111111111111111110000" // ToShortest(100000000000000000000.0) -> "100000000000000000000" // ToShortest(1111111111111111111111.0) -> "1.1111111111111111e+21" // // Note: the conversion may round the output if the returned string // is accurate enough to uniquely identify the input-number. // For example the most precise representation of the double 9e59 equals // "899999999999999918767229449717619953810131273674690656206848", but // the converter will return the shorter (but still correct) "9e59". // // Returns true if the conversion succeeds. The conversion always succeeds // except when the input value is special and no infinity_symbol or // nan_symbol has been given to the constructor. bool ToShortest(double value, StringBuilder* result_builder) const { return ToShortestIeeeNumber(value, result_builder, SHORTEST); } // Same as ToShortest, but for single-precision floats. bool ToShortestSingle(float value, StringBuilder* result_builder) const { return ToShortestIeeeNumber(value, result_builder, SHORTEST_SINGLE); } // Computes a decimal representation with a fixed number of digits after the // decimal point. The last emitted digit is rounded. // // Examples: // ToFixed(3.12, 1) -> "3.1" // ToFixed(3.1415, 3) -> "3.142" // ToFixed(1234.56789, 4) -> "1234.5679" // ToFixed(1.23, 5) -> "1.23000" // ToFixed(0.1, 4) -> "0.1000" // ToFixed(1e30, 2) -> "1000000000000000019884624838656.00" // ToFixed(0.1, 30) -> "0.100000000000000005551115123126" // ToFixed(0.1, 17) -> "0.10000000000000001" // // If requested_digits equals 0, then the tail of the result depends on // the EMIT_TRAILING_DECIMAL_POINT and EMIT_TRAILING_ZERO_AFTER_POINT. // Examples, for requested_digits == 0, // let EMIT_TRAILING_DECIMAL_POINT and EMIT_TRAILING_ZERO_AFTER_POINT be // - false and false: then 123.45 -> 123 // 0.678 -> 1 // - true and false: then 123.45 -> 123. // 0.678 -> 1. // - true and true: then 123.45 -> 123.0 // 0.678 -> 1.0 // // Returns true if the conversion succeeds. The conversion always succeeds // except for the following cases: // - the input value is special and no infinity_symbol or nan_symbol has // been provided to the constructor, // - 'value' > 10^kMaxFixedDigitsBeforePoint, or // - 'requested_digits' > kMaxFixedDigitsAfterPoint. // The last two conditions imply that the result will never contain more than // 1 + kMaxFixedDigitsBeforePoint + 1 + kMaxFixedDigitsAfterPoint characters // (one additional character for the sign, and one for the decimal point). bool ToFixed(double value, int requested_digits, StringBuilder* result_builder) const; // Computes a representation in exponential format with requested_digits // after the decimal point. The last emitted digit is rounded. 
// If requested_digits equals -1, then the shortest exponential representation // is computed. // // Examples with EMIT_POSITIVE_EXPONENT_SIGN deactivated, and // exponent_character set to 'e'. // ToExponential(3.12, 1) -> "3.1e0" // ToExponential(5.0, 3) -> "5.000e0" // ToExponential(0.001, 2) -> "1.00e-3" // ToExponential(3.1415, -1) -> "3.1415e0" // ToExponential(3.1415, 4) -> "3.1415e0" // ToExponential(3.1415, 3) -> "3.142e0" // ToExponential(123456789000000, 3) -> "1.235e14" // ToExponential(1000000000000000019884624838656.0, -1) -> "1e30" // ToExponential(1000000000000000019884624838656.0, 32) -> // "1.00000000000000001988462483865600e30" // ToExponential(1234, 0) -> "1e3" // // Returns true if the conversion succeeds. The conversion always succeeds // except for the following cases: // - the input value is special and no infinity_symbol or nan_symbol has // been provided to the constructor, // - 'requested_digits' > kMaxExponentialDigits. // The last condition implies that the result will never contain more than // kMaxExponentialDigits + 8 characters (the sign, the digit before the // decimal point, the decimal point, the exponent character, the // exponent's sign, and at most 3 exponent digits). bool ToExponential(double value, int requested_digits, StringBuilder* result_builder) const; // Computes 'precision' leading digits of the given 'value' and returns them // either in exponential or decimal format, depending on // max_{leading|trailing}_padding_zeroes_in_precision_mode (given to the // constructor). // The last computed digit is rounded. // // Example with max_leading_padding_zeroes_in_precision_mode = 6. // ToPrecision(0.0000012345, 2) -> "0.0000012" // ToPrecision(0.00000012345, 2) -> "1.2e-7" // Similarly the converter may add up to // max_trailing_padding_zeroes_in_precision_mode in precision mode to avoid // returning an exponential representation. A zero added by the // EMIT_TRAILING_ZERO_AFTER_POINT flag is counted for this limit. // Examples for max_trailing_padding_zeroes_in_precision_mode = 1: // ToPrecision(230.0, 2) -> "230" // ToPrecision(230.0, 2) -> "230." with EMIT_TRAILING_DECIMAL_POINT. // ToPrecision(230.0, 2) -> "2.3e2" with EMIT_TRAILING_ZERO_AFTER_POINT. // Examples for max_trailing_padding_zeroes_in_precision_mode = 3, and no // EMIT_TRAILING_ZERO_AFTER_POINT: // ToPrecision(123450.0, 6) -> "123450" // ToPrecision(123450.0, 5) -> "123450" // ToPrecision(123450.0, 4) -> "123500" // ToPrecision(123450.0, 3) -> "123000" // ToPrecision(123450.0, 2) -> "1.2e5" // // Returns true if the conversion succeeds. The conversion always succeeds // except for the following cases: // - the input value is special and no infinity_symbol or nan_symbol has // been provided to the constructor, // - precision < kMinPrecisionDigits // - precision > kMaxPrecisionDigits // The last condition implies that the result will never contain more than // kMaxPrecisionDigits + 7 characters (the sign, the decimal point, the // exponent character, the exponent's sign, and at most 3 exponent digits). bool ToPrecision(double value, int precision, StringBuilder* result_builder) const; enum DtoaMode { // Produce the shortest correct representation. // For example the output of 0.299999999999999988897 is (the less accurate // but correct) 0.3. SHORTEST, // Same as SHORTEST, but for single-precision floats. SHORTEST_SINGLE, // Produce a fixed number of digits after the decimal point. // For instance fixed(0.1, 4) becomes 0.1000 // If the input number is big, the output will be big.
FIXED, // Fixed number of digits (independent of the decimal point). PRECISION }; // The maximal number of digits that are needed to emit a double in base 10. // A higher precision can be achieved by using more digits, but the shortest // accurate representation of any double will never use more digits than // kBase10MaximalLength. // Note that DoubleToAscii null-terminates its input. So the given buffer // should be at least kBase10MaximalLength + 1 characters long. static const int kBase10MaximalLength = 17; // Converts the given double 'v' to ascii. 'v' must not be NaN, +Infinity, or // -Infinity. In SHORTEST_SINGLE-mode this restriction also applies to 'v' // after it has been casted to a single-precision float. That is, in this // mode static_cast(v) must not be NaN, +Infinity or -Infinity. // // The result should be interpreted as buffer * 10^(point-length). // // The output depends on the given mode: // - SHORTEST: produce the least amount of digits for which the internal // identity requirement is still satisfied. If the digits are printed // (together with the correct exponent) then reading this number will give // 'v' again. The buffer will choose the representation that is closest to // 'v'. If there are two at the same distance, than the one farther away // from 0 is chosen (halfway cases - ending with 5 - are rounded up). // In this mode the 'requested_digits' parameter is ignored. // - SHORTEST_SINGLE: same as SHORTEST but with single-precision. // - FIXED: produces digits necessary to print a given number with // 'requested_digits' digits after the decimal point. The produced digits // might be too short in which case the caller has to fill the remainder // with '0's. // Example: toFixed(0.001, 5) is allowed to return buffer="1", point=-2. // Halfway cases are rounded towards +/-Infinity (away from 0). The call // toFixed(0.15, 2) thus returns buffer="2", point=0. // The returned buffer may contain digits that would be truncated from the // shortest representation of the input. // - PRECISION: produces 'requested_digits' where the first digit is not '0'. // Even though the length of produced digits usually equals // 'requested_digits', the function is allowed to return fewer digits, in // which case the caller has to fill the missing digits with '0's. // Halfway cases are again rounded away from 0. // DoubleToAscii expects the given buffer to be big enough to hold all // digits and a terminating null-character. In SHORTEST-mode it expects a // buffer of at least kBase10MaximalLength + 1. In all other modes the // requested_digits parameter and the padding-zeroes limit the size of the // output. Don't forget the decimal point, the exponent character and the // terminating null-character when computing the maximal output size. // The given length is only used in debug mode to ensure the buffer is big // enough. static void DoubleToAscii(double v, DtoaMode mode, int requested_digits, char* buffer, int buffer_length, bool* sign, int* length, int* point); private: // Implementation for ToShortest and ToShortestSingle. bool ToShortestIeeeNumber(double value, StringBuilder* result_builder, DtoaMode mode) const; // If the value is a special value (NaN or Infinity) constructs the // corresponding string using the configured infinity/nan-symbol. // If either of them is NULL or the value is not special then the // function returns false. bool HandleSpecialValues(double value, StringBuilder* result_builder) const; // Constructs an exponential representation (i.e. 1.234e56). 
// The given exponent assumes a decimal point after the first decimal digit. void CreateExponentialRepresentation(const char* decimal_digits, int length, int exponent, StringBuilder* result_builder) const; // Creates a decimal representation (i.e 1234.5678). void CreateDecimalRepresentation(const char* decimal_digits, int length, int decimal_point, int digits_after_point, StringBuilder* result_builder) const; const int flags_; const char* const infinity_symbol_; const char* const nan_symbol_; const char exponent_character_; const int decimal_in_shortest_low_; const int decimal_in_shortest_high_; const int max_leading_padding_zeroes_in_precision_mode_; const int max_trailing_padding_zeroes_in_precision_mode_; DISALLOW_IMPLICIT_CONSTRUCTORS(DoubleToStringConverter); }; class StringToDoubleConverter { public: // Enumeration for allowing octals and ignoring junk when converting // strings to numbers. enum Flags { NO_FLAGS = 0, ALLOW_HEX = 1, ALLOW_OCTALS = 2, ALLOW_TRAILING_JUNK = 4, ALLOW_LEADING_SPACES = 8, ALLOW_TRAILING_SPACES = 16, ALLOW_SPACES_AFTER_SIGN = 32 }; // Flags should be a bit-or combination of the possible Flags-enum. // - NO_FLAGS: no special flags. // - ALLOW_HEX: recognizes the prefix "0x". Hex numbers may only be integers. // Ex: StringToDouble("0x1234") -> 4660.0 // In StringToDouble("0x1234.56") the characters ".56" are trailing // junk. The result of the call is hence dependent on // the ALLOW_TRAILING_JUNK flag and/or the junk value. // With this flag "0x" is a junk-string. Even with ALLOW_TRAILING_JUNK, // the string will not be parsed as "0" followed by junk. // // - ALLOW_OCTALS: recognizes the prefix "0" for octals: // If a sequence of octal digits starts with '0', then the number is // read as octal integer. Octal numbers may only be integers. // Ex: StringToDouble("01234") -> 668.0 // StringToDouble("012349") -> 12349.0 // Not a sequence of octal // // digits. // In StringToDouble("01234.56") the characters ".56" are trailing // junk. The result of the call is hence dependent on // the ALLOW_TRAILING_JUNK flag and/or the junk value. // In StringToDouble("01234e56") the characters "e56" are trailing // junk, too. // - ALLOW_TRAILING_JUNK: ignore trailing characters that are not part of // a double literal. // - ALLOW_LEADING_SPACES: skip over leading spaces. // - ALLOW_TRAILING_SPACES: ignore trailing spaces. // - ALLOW_SPACES_AFTER_SIGN: ignore spaces after the sign. // Ex: StringToDouble("- 123.2") -> -123.2. // StringToDouble("+ 123.2") -> 123.2 // // empty_string_value is returned when an empty string is given as input. // If ALLOW_LEADING_SPACES or ALLOW_TRAILING_SPACES are set, then a string // containing only spaces is converted to the 'empty_string_value', too. // // junk_string_value is returned when // a) ALLOW_TRAILING_JUNK is not set, and a junk character (a character not // part of a double-literal) is found. // b) ALLOW_TRAILING_JUNK is set, but the string does not start with a // double literal. // // infinity_symbol and nan_symbol are strings that are used to detect // inputs that represent infinity and NaN. They can be null, in which case // they are ignored. // The conversion routine first reads any possible signs. Then it compares the // following character of the input-string with the first character of // the infinity, and nan-symbol. If either matches, the function assumes, that // a match has been found, and expects the following input characters to match // the remaining characters of the special-value symbol. 
// This means that the following restrictions apply to special-value symbols: // - they must not start with signs ('+', or '-'), // - they must not have the same first character. // - they must not start with digits. // // Examples: // flags = ALLOW_HEX | ALLOW_TRAILING_JUNK, // empty_string_value = 0.0, // junk_string_value = NaN, // infinity_symbol = "infinity", // nan_symbol = "nan": // StringToDouble("0x1234") -> 4660.0. // StringToDouble("0x1234K") -> 4660.0. // StringToDouble("") -> 0.0 // empty_string_value. // StringToDouble(" ") -> NaN // junk_string_value. // StringToDouble(" 1") -> NaN // junk_string_value. // StringToDouble("0x") -> NaN // junk_string_value. // StringToDouble("-123.45") -> -123.45. // StringToDouble("--123.45") -> NaN // junk_string_value. // StringToDouble("123e45") -> 123e45. // StringToDouble("123E45") -> 123e45. // StringToDouble("123e+45") -> 123e45. // StringToDouble("123E-45") -> 123e-45. // StringToDouble("123e") -> 123.0 // trailing junk ignored. // StringToDouble("123e-") -> 123.0 // trailing junk ignored. // StringToDouble("+NaN") -> NaN // NaN string literal. // StringToDouble("-infinity") -> -inf. // infinity literal. // StringToDouble("Infinity") -> NaN // junk_string_value. // // flags = ALLOW_OCTAL | ALLOW_LEADING_SPACES, // empty_string_value = 0.0, // junk_string_value = NaN, // infinity_symbol = NULL, // nan_symbol = NULL: // StringToDouble("0x1234") -> NaN // junk_string_value. // StringToDouble("01234") -> 668.0. // StringToDouble("") -> 0.0 // empty_string_value. // StringToDouble(" ") -> 0.0 // empty_string_value. // StringToDouble(" 1") -> 1.0 // StringToDouble("0x") -> NaN // junk_string_value. // StringToDouble("0123e45") -> NaN // junk_string_value. // StringToDouble("01239E45") -> 1239e45. // StringToDouble("-infinity") -> NaN // junk_string_value. // StringToDouble("NaN") -> NaN // junk_string_value. StringToDoubleConverter(int flags, double empty_string_value, double junk_string_value, const char* infinity_symbol, const char* nan_symbol) : flags_(flags), empty_string_value_(empty_string_value), junk_string_value_(junk_string_value), infinity_symbol_(infinity_symbol), nan_symbol_(nan_symbol) { } // Performs the conversion. // The output parameter 'processed_characters_count' is set to the number // of characters that have been processed to read the number. // Spaces than are processed with ALLOW_{LEADING|TRAILING}_SPACES are included // in the 'processed_characters_count'. Trailing junk is never included. double StringToDouble(const char* buffer, int length, int* processed_characters_count) const { return StringToIeee(buffer, length, processed_characters_count, true); } // Same as StringToDouble but reads a float. // Note that this is not equivalent to static_cast(StringToDouble(...)) // due to potential double-rounding. 
float StringToFloat(const char* buffer, int length, int* processed_characters_count) const { return static_cast(StringToIeee(buffer, length, processed_characters_count, false)); } private: const int flags_; const double empty_string_value_; const double junk_string_value_; const char* const infinity_symbol_; const char* const nan_symbol_; double StringToIeee(const char* buffer, int length, int* processed_characters_count, bool read_as_double) const; DISALLOW_IMPLICIT_CONSTRUCTORS(StringToDoubleConverter); }; } // namespace double_conversion #endif // DOUBLE_CONVERSION_DOUBLE_CONVERSION_H_ ================================================ FILE: src/kenlm/util/double-conversion/fast-dtoa.cc ================================================ // Copyright 2012 the V8 project authors. All rights reserved. // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following // disclaimer in the documentation and/or other materials provided // with the distribution. // * Neither the name of Google Inc. nor the names of its // contributors may be used to endorse or promote products derived // from this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #include "fast-dtoa.h" #include "cached-powers.h" #include "diy-fp.h" #include "ieee.h" namespace double_conversion { // The minimal and maximal target exponent define the range of w's binary // exponent, where 'w' is the result of multiplying the input by a cached power // of ten. // // A different range might be chosen on a different platform, to optimize digit // generation, but a smaller range requires more powers of ten to be cached. static const int kMinimalTargetExponent = -60; static const int kMaximalTargetExponent = -32; // Adjusts the last digit of the generated number, and screens out generated // solutions that may be inaccurate. A solution may be inaccurate if it is // outside the safe interval, or if we cannot prove that it is closer to the // input than a neighboring representation of the same length. 
// // Input: * buffer containing the digits of too_high / 10^kappa // * the buffer's length // * distance_too_high_w == (too_high - w).f() * unit // * unsafe_interval == (too_high - too_low).f() * unit // * rest = (too_high - buffer * 10^kappa).f() * unit // * ten_kappa = 10^kappa * unit // * unit = the common multiplier // Output: returns true if the buffer is guaranteed to contain the closest // representable number to the input. // Modifies the generated digits in the buffer to approach (round towards) w. static bool RoundWeed(Vector buffer, int length, uint64_t distance_too_high_w, uint64_t unsafe_interval, uint64_t rest, uint64_t ten_kappa, uint64_t unit) { uint64_t small_distance = distance_too_high_w - unit; uint64_t big_distance = distance_too_high_w + unit; // Let w_low = too_high - big_distance, and // w_high = too_high - small_distance. // Note: w_low < w < w_high // // The real w (* unit) must lie somewhere inside the interval // ]w_low; w_high[ (often written as "(w_low; w_high)") // Basically the buffer currently contains a number in the unsafe interval // ]too_low; too_high[ with too_low < w < too_high // // too_high - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - // ^v 1 unit ^ ^ ^ ^ // boundary_high --------------------- . . . . // ^v 1 unit . . . . // - - - - - - - - - - - - - - - - - - - + - - + - - - - - - . . // . . ^ . . // . big_distance . . . // . . . . rest // small_distance . . . . // v . . . . // w_high - - - - - - - - - - - - - - - - - - . . . . // ^v 1 unit . . . . // w ---------------------------------------- . . . . // ^v 1 unit v . . . // w_low - - - - - - - - - - - - - - - - - - - - - . . . // . . v // buffer --------------------------------------------------+-------+-------- // . . // safe_interval . // v . // - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - . // ^v 1 unit . // boundary_low ------------------------- unsafe_interval // ^v 1 unit v // too_low - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - // // // Note that the value of buffer could lie anywhere inside the range too_low // to too_high. // // boundary_low, boundary_high and w are approximations of the real boundaries // and v (the input number). They are guaranteed to be precise up to one unit. // In fact the error is guaranteed to be strictly less than one unit. // // Anything that lies outside the unsafe interval is guaranteed not to round // to v when read again. // Anything that lies inside the safe interval is guaranteed to round to v // when read again. // If the number inside the buffer lies inside the unsafe interval but not // inside the safe interval then we simply do not know and bail out (returning // false). // // Similarly we have to take into account the imprecision of 'w' when finding // the closest representation of 'w'. If we have two potential // representations, and one is closer to both w_low and w_high, then we know // it is closer to the actual value v. // // By generating the digits of too_high we got the largest (closest to // too_high) buffer that is still in the unsafe interval. In the case where // w_high < buffer < too_high we try to decrement the buffer. // This way the buffer approaches (rounds towards) w. // There are 3 conditions that stop the decrementation process: // 1) the buffer is already below w_high // 2) decrementing the buffer would make it leave the unsafe interval // 3) decrementing the buffer would yield a number below w_high and farther // away than the current number. 
In other words: // (buffer{-1} < w_high) && w_high - buffer{-1} > buffer - w_high // Instead of using the buffer directly we use its distance to too_high. // Conceptually rest ~= too_high - buffer // We need to do the following tests in this order to avoid over- and // underflows. ASSERT(rest <= unsafe_interval); while (rest < small_distance && // Negated condition 1 unsafe_interval - rest >= ten_kappa && // Negated condition 2 (rest + ten_kappa < small_distance || // buffer{-1} > w_high small_distance - rest >= rest + ten_kappa - small_distance)) { buffer[length - 1]--; rest += ten_kappa; } // We have approached w+ as much as possible. We now test if approaching w- // would require changing the buffer. If yes, then we have two possible // representations close to w, but we cannot decide which one is closer. if (rest < big_distance && unsafe_interval - rest >= ten_kappa && (rest + ten_kappa < big_distance || big_distance - rest > rest + ten_kappa - big_distance)) { return false; } // Weeding test. // The safe interval is [too_low + 2 ulp; too_high - 2 ulp] // Since too_low = too_high - unsafe_interval this is equivalent to // [too_high - unsafe_interval + 4 ulp; too_high - 2 ulp] // Conceptually we have: rest ~= too_high - buffer return (2 * unit <= rest) && (rest <= unsafe_interval - 4 * unit); } // Rounds the buffer upwards if the result is closer to v by possibly adding // 1 to the buffer. If the precision of the calculation is not sufficient to // round correctly, return false. // The rounding might shift the whole buffer in which case the kappa is // adjusted. For example "99", kappa = 3 might become "10", kappa = 4. // // If 2*rest > ten_kappa then the buffer needs to be round up. // rest can have an error of +/- 1 unit. This function accounts for the // imprecision and returns false, if the rounding direction cannot be // unambiguously determined. // // Precondition: rest < ten_kappa. static bool RoundWeedCounted(Vector buffer, int length, uint64_t rest, uint64_t ten_kappa, uint64_t unit, int* kappa) { ASSERT(rest < ten_kappa); // The following tests are done in a specific order to avoid overflows. They // will work correctly with any uint64 values of rest < ten_kappa and unit. // // If the unit is too big, then we don't know which way to round. For example // a unit of 50 means that the real number lies within rest +/- 50. If // 10^kappa == 40 then there is no way to tell which way to round. if (unit >= ten_kappa) return false; // Even if unit is just half the size of 10^kappa we are already completely // lost. (And after the previous test we know that the expression will not // over/underflow.) if (ten_kappa - unit <= unit) return false; // If 2 * (rest + unit) <= 10^kappa we can safely round down. if ((ten_kappa - rest > rest) && (ten_kappa - 2 * rest >= 2 * unit)) { return true; } // If 2 * (rest - unit) >= 10^kappa, then we can safely round up. if ((rest > unit) && (ten_kappa - (rest - unit) <= (rest - unit))) { // Increment the last digit recursively until we find a non '9' digit. buffer[length - 1]++; for (int i = length - 1; i > 0; --i) { if (buffer[i] != '0' + 10) break; buffer[i] = '0'; buffer[i - 1]++; } // If the first digit is now '0'+ 10 we had a buffer with all '9's. With the // exception of the first digit all digits are now '0'. Simply switch the // first digit to '1' and adjust the kappa. Example: "99" becomes "10" and // the power (the kappa) is increased. 
if (buffer[0] == '0' + 10) { buffer[0] = '1'; (*kappa) += 1; } return true; } return false; } // Returns the biggest power of ten that is less than or equal to the given // number. We furthermore receive the maximum number of bits 'number' has. // // Returns power == 10^(exponent_plus_one-1) such that // power <= number < power * 10. // If number_bits == 0 then 0^(0-1) is returned. // The number of bits must be <= 32. // Precondition: number < (1 << (number_bits + 1)). // Inspired by the method for finding an integer log base 10 from here: // http://graphics.stanford.edu/~seander/bithacks.html#IntegerLog10 static unsigned int const kSmallPowersOfTen[] = {0, 1, 10, 100, 1000, 10000, 100000, 1000000, 10000000, 100000000, 1000000000}; static void BiggestPowerTen(uint32_t number, int number_bits, uint32_t* power, int* exponent_plus_one) { ASSERT(number < (1u << (number_bits + 1))); // 1233/4096 is approximately 1/lg(10). int exponent_plus_one_guess = ((number_bits + 1) * 1233 >> 12); // We increment to skip over the first entry in the kPowersOf10 table. // Note: kPowersOf10[i] == 10^(i-1). exponent_plus_one_guess++; // We don't have any guarantees that 2^number_bits <= number. // TODO(floitsch): can we change the 'while' into an 'if'? We definitely see // number < (2^number_bits - 1), but I haven't encountered // number < (2^number_bits - 2) yet. while (number < kSmallPowersOfTen[exponent_plus_one_guess]) { exponent_plus_one_guess--; } *power = kSmallPowersOfTen[exponent_plus_one_guess]; *exponent_plus_one = exponent_plus_one_guess; } // Generates the digits of input number w. // w is a floating-point number (DiyFp), consisting of a significand and an // exponent. Its exponent is bounded by kMinimalTargetExponent and // kMaximalTargetExponent. // Hence -60 <= w.e() <= -32. // // Returns false if it fails, in which case the generated digits in the buffer // should not be used. // Preconditions: // * low, w and high are correct up to 1 ulp (unit in the last place). That // is, their error must be less than a unit of their last digits. // * low.e() == w.e() == high.e() // * low < w < high, and taking into account their error: low~ <= high~ // * kMinimalTargetExponent <= w.e() <= kMaximalTargetExponent // Postconditions: returns false if procedure fails. // otherwise: // * buffer is not null-terminated, but len contains the number of digits. // * buffer contains the shortest possible decimal digit-sequence // such that LOW < buffer * 10^kappa < HIGH, where LOW and HIGH are the // correct values of low and high (without their error). // * if more than one decimal representation gives the minimal number of // decimal digits then the one closest to W (where W is the correct value // of w) is chosen. // Remark: this procedure takes into account the imprecision of its input // numbers. If the precision is not enough to guarantee all the postconditions // then false is returned. This usually happens rarely (~0.5%). // // Say, for the sake of example, that // w.e() == -48, and w.f() == 0x1234567890abcdef // w's value can be computed by w.f() * 2^w.e() // We can obtain w's integral digits by simply shifting w.f() by -w.e(). // -> w's integral part is 0x1234 // w's fractional part is therefore 0x567890abcdef. // Printing w's integral part is easy (simply print 0x1234 in decimal). // In order to print its fraction we repeatedly multiply the fraction by 10 and // get each digit. Example the first digit after the point would be computed by // (0x567890abcdef * 10) >> 48. 
-> 3 // The whole thing becomes slightly more complicated because we want to stop // once we have enough digits. That is, once the digits inside the buffer // represent 'w' we can stop. Everything inside the interval low - high // represents w. However we have to pay attention to low, high and w's // imprecision. static bool DigitGen(DiyFp low, DiyFp w, DiyFp high, Vector buffer, int* length, int* kappa) { ASSERT(low.e() == w.e() && w.e() == high.e()); ASSERT(low.f() + 1 <= high.f() - 1); ASSERT(kMinimalTargetExponent <= w.e() && w.e() <= kMaximalTargetExponent); // low, w and high are imprecise, but by less than one ulp (unit in the last // place). // If we remove (resp. add) 1 ulp from low (resp. high) we are certain that // the new numbers are outside of the interval we want the final // representation to lie in. // Inversely adding (resp. removing) 1 ulp from low (resp. high) would yield // numbers that are certain to lie in the interval. We will use this fact // later on. // We will now start by generating the digits within the uncertain // interval. Later we will weed out representations that lie outside the safe // interval and thus _might_ lie outside the correct interval. uint64_t unit = 1; DiyFp too_low = DiyFp(low.f() - unit, low.e()); DiyFp too_high = DiyFp(high.f() + unit, high.e()); // too_low and too_high are guaranteed to lie outside the interval we want the // generated number in. DiyFp unsafe_interval = DiyFp::Minus(too_high, too_low); // We now cut the input number into two parts: the integral digits and the // fractionals. We will not write any decimal separator though, but adapt // kappa instead. // Reminder: we are currently computing the digits (stored inside the buffer) // such that: too_low < buffer * 10^kappa < too_high // We use too_high for the digit_generation and stop as soon as possible. // If we stop early we effectively round down. DiyFp one = DiyFp(static_cast(1) << -w.e(), w.e()); // Division by one is a shift. uint32_t integrals = static_cast(too_high.f() >> -one.e()); // Modulo by one is an and. uint64_t fractionals = too_high.f() & (one.f() - 1); uint32_t divisor; int divisor_exponent_plus_one; BiggestPowerTen(integrals, DiyFp::kSignificandSize - (-one.e()), &divisor, &divisor_exponent_plus_one); *kappa = divisor_exponent_plus_one; *length = 0; // Loop invariant: buffer = too_high / 10^kappa (integer division) // The invariant holds for the first iteration: kappa has been initialized // with the divisor exponent + 1. And the divisor is the biggest power of ten // that is smaller than integrals. while (*kappa > 0) { int digit = integrals / divisor; buffer[*length] = '0' + digit; (*length)++; integrals %= divisor; (*kappa)--; // Note that kappa now equals the exponent of the divisor and that the // invariant thus holds again. uint64_t rest = (static_cast(integrals) << -one.e()) + fractionals; // Invariant: too_high = buffer * 10^kappa + DiyFp(rest, one.e()) // Reminder: unsafe_interval.e() == one.e() if (rest < unsafe_interval.f()) { // Rounding down (by not emitting the remaining digits) yields a number // that lies within the unsafe interval. return RoundWeed(buffer, *length, DiyFp::Minus(too_high, w).f(), unsafe_interval.f(), rest, static_cast(divisor) << -one.e(), unit); } divisor /= 10; } // The integrals have been generated. We are at the point of the decimal // separator. In the following loop we simply multiply the remaining digits by // 10 and divide by one. 
We just need to pay attention to multiply associated // data (like the interval or 'unit'), too. // Note that the multiplication by 10 does not overflow, because w.e >= -60 // and thus one.e >= -60. ASSERT(one.e() >= -60); ASSERT(fractionals < one.f()); ASSERT(UINT64_2PART_C(0xFFFFFFFF, FFFFFFFF) / 10 >= one.f()); while (true) { fractionals *= 10; unit *= 10; unsafe_interval.set_f(unsafe_interval.f() * 10); // Integer division by one. int digit = static_cast(fractionals >> -one.e()); buffer[*length] = '0' + digit; (*length)++; fractionals &= one.f() - 1; // Modulo by one. (*kappa)--; if (fractionals < unsafe_interval.f()) { return RoundWeed(buffer, *length, DiyFp::Minus(too_high, w).f() * unit, unsafe_interval.f(), fractionals, one.f(), unit); } } } // Generates (at most) requested_digits digits of input number w. // w is a floating-point number (DiyFp), consisting of a significand and an // exponent. Its exponent is bounded by kMinimalTargetExponent and // kMaximalTargetExponent. // Hence -60 <= w.e() <= -32. // // Returns false if it fails, in which case the generated digits in the buffer // should not be used. // Preconditions: // * w is correct up to 1 ulp (unit in the last place). That // is, its error must be strictly less than a unit of its last digit. // * kMinimalTargetExponent <= w.e() <= kMaximalTargetExponent // // Postconditions: returns false if procedure fails. // otherwise: // * buffer is not null-terminated, but length contains the number of // digits. // * the representation in buffer is the most precise representation of // requested_digits digits. // * buffer contains at most requested_digits digits of w. If there are less // than requested_digits digits then some trailing '0's have been removed. // * kappa is such that // w = buffer * 10^kappa + eps with |eps| < 10^kappa / 2. // // Remark: This procedure takes into account the imprecision of its input // numbers. If the precision is not enough to guarantee all the postconditions // then false is returned. This usually happens rarely, but the failure-rate // increases with higher requested_digits. static bool DigitGenCounted(DiyFp w, int requested_digits, Vector buffer, int* length, int* kappa) { ASSERT(kMinimalTargetExponent <= w.e() && w.e() <= kMaximalTargetExponent); ASSERT(kMinimalTargetExponent >= -60); ASSERT(kMaximalTargetExponent <= -32); // w is assumed to have an error less than 1 unit. Whenever w is scaled we // also scale its error. uint64_t w_error = 1; // We cut the input number into two parts: the integral digits and the // fractional digits. We don't emit any decimal separator, but adapt kappa // instead. Example: instead of writing "1.2" we put "12" into the buffer and // increase kappa by 1. DiyFp one = DiyFp(static_cast(1) << -w.e(), w.e()); // Division by one is a shift. uint32_t integrals = static_cast(w.f() >> -one.e()); // Modulo by one is an and. uint64_t fractionals = w.f() & (one.f() - 1); uint32_t divisor; int divisor_exponent_plus_one; BiggestPowerTen(integrals, DiyFp::kSignificandSize - (-one.e()), &divisor, &divisor_exponent_plus_one); *kappa = divisor_exponent_plus_one; *length = 0; // Loop invariant: buffer = w / 10^kappa (integer division) // The invariant holds for the first iteration: kappa has been initialized // with the divisor exponent + 1. And the divisor is the biggest power of ten // that is smaller than 'integrals'. 
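// Illustrative example (not part of the original source): if integrals == 4660
// at this point, BiggestPowerTen yields divisor == 1000 and kappa starts at 4,
// so the first iteration below emits the digit 4660 / 1000 == 4.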
while (*kappa > 0) { int digit = integrals / divisor; buffer[*length] = '0' + digit; (*length)++; requested_digits--; integrals %= divisor; (*kappa)--; // Note that kappa now equals the exponent of the divisor and that the // invariant thus holds again. if (requested_digits == 0) break; divisor /= 10; } if (requested_digits == 0) { uint64_t rest = (static_cast(integrals) << -one.e()) + fractionals; return RoundWeedCounted(buffer, *length, rest, static_cast(divisor) << -one.e(), w_error, kappa); } // The integrals have been generated. We are at the point of the decimal // separator. In the following loop we simply multiply the remaining digits by // 10 and divide by one. We just need to pay attention to multiply associated // data (the 'unit'), too. // Note that the multiplication by 10 does not overflow, because w.e >= -60 // and thus one.e >= -60. ASSERT(one.e() >= -60); ASSERT(fractionals < one.f()); ASSERT(UINT64_2PART_C(0xFFFFFFFF, FFFFFFFF) / 10 >= one.f()); while (requested_digits > 0 && fractionals > w_error) { fractionals *= 10; w_error *= 10; // Integer division by one. int digit = static_cast(fractionals >> -one.e()); buffer[*length] = '0' + digit; (*length)++; requested_digits--; fractionals &= one.f() - 1; // Modulo by one. (*kappa)--; } if (requested_digits != 0) return false; return RoundWeedCounted(buffer, *length, fractionals, one.f(), w_error, kappa); } // Provides a decimal representation of v. // Returns true if it succeeds, otherwise the result cannot be trusted. // There will be *length digits inside the buffer (not null-terminated). // If the function returns true then // v == (double) (buffer * 10^decimal_exponent). // The digits in the buffer are the shortest representation possible: no // 0.09999999999999999 instead of 0.1. The shorter representation will even be // chosen even if the longer one would be closer to v. // The last digit will be closest to the actual v. That is, even if several // digits might correctly yield 'v' when read again, the closest will be // computed. static bool Grisu3(double v, FastDtoaMode mode, Vector buffer, int* length, int* decimal_exponent) { DiyFp w = Double(v).AsNormalizedDiyFp(); // boundary_minus and boundary_plus are the boundaries between v and its // closest floating-point neighbors. Any number strictly between // boundary_minus and boundary_plus will round to v when convert to a double. // Grisu3 will never output representations that lie exactly on a boundary. DiyFp boundary_minus, boundary_plus; if (mode == FAST_DTOA_SHORTEST) { Double(v).NormalizedBoundaries(&boundary_minus, &boundary_plus); } else { ASSERT(mode == FAST_DTOA_SHORTEST_SINGLE); float single_v = static_cast(v); Single(single_v).NormalizedBoundaries(&boundary_minus, &boundary_plus); } ASSERT(boundary_plus.e() == w.e()); DiyFp ten_mk; // Cached power of ten: 10^-k int mk; // -k int ten_mk_minimal_binary_exponent = kMinimalTargetExponent - (w.e() + DiyFp::kSignificandSize); int ten_mk_maximal_binary_exponent = kMaximalTargetExponent - (w.e() + DiyFp::kSignificandSize); PowersOfTenCache::GetCachedPowerForBinaryExponentRange( ten_mk_minimal_binary_exponent, ten_mk_maximal_binary_exponent, &ten_mk, &mk); ASSERT((kMinimalTargetExponent <= w.e() + ten_mk.e() + DiyFp::kSignificandSize) && (kMaximalTargetExponent >= w.e() + ten_mk.e() + DiyFp::kSignificandSize)); // Note that ten_mk is only an approximation of 10^-k. A DiyFp only contains a // 64 bit significand and ten_mk is thus only precise up to 64 bits. 
// The DiyFp::Times procedure rounds its result, and ten_mk is approximated // too. The variable scaled_w (as well as scaled_boundary_minus/plus) are now // off by a small amount. // In fact: scaled_w - w*10^k < 1ulp (unit in the last place) of scaled_w. // In other words: let f = scaled_w.f() and e = scaled_w.e(), then // (f-1) * 2^e < w*10^k < (f+1) * 2^e DiyFp scaled_w = DiyFp::Times(w, ten_mk); ASSERT(scaled_w.e() == boundary_plus.e() + ten_mk.e() + DiyFp::kSignificandSize); // In theory it would be possible to avoid some recomputations by computing // the difference between w and boundary_minus/plus (a power of 2) and to // compute scaled_boundary_minus/plus by subtracting/adding from // scaled_w. However the code becomes much less readable and the speed // enhancements are not terriffic. DiyFp scaled_boundary_minus = DiyFp::Times(boundary_minus, ten_mk); DiyFp scaled_boundary_plus = DiyFp::Times(boundary_plus, ten_mk); // DigitGen will generate the digits of scaled_w. Therefore we have // v == (double) (scaled_w * 10^-mk). // Set decimal_exponent == -mk and pass it to DigitGen. If scaled_w is not an // integer than it will be updated. For instance if scaled_w == 1.23 then // the buffer will be filled with "123" und the decimal_exponent will be // decreased by 2. int kappa; bool result = DigitGen(scaled_boundary_minus, scaled_w, scaled_boundary_plus, buffer, length, &kappa); *decimal_exponent = -mk + kappa; return result; } // The "counted" version of grisu3 (see above) only generates requested_digits // number of digits. This version does not generate the shortest representation, // and with enough requested digits 0.1 will at some point print as 0.9999999... // Grisu3 is too imprecise for real halfway cases (1.5 will not work) and // therefore the rounding strategy for halfway cases is irrelevant. static bool Grisu3Counted(double v, int requested_digits, Vector buffer, int* length, int* decimal_exponent) { DiyFp w = Double(v).AsNormalizedDiyFp(); DiyFp ten_mk; // Cached power of ten: 10^-k int mk; // -k int ten_mk_minimal_binary_exponent = kMinimalTargetExponent - (w.e() + DiyFp::kSignificandSize); int ten_mk_maximal_binary_exponent = kMaximalTargetExponent - (w.e() + DiyFp::kSignificandSize); PowersOfTenCache::GetCachedPowerForBinaryExponentRange( ten_mk_minimal_binary_exponent, ten_mk_maximal_binary_exponent, &ten_mk, &mk); ASSERT((kMinimalTargetExponent <= w.e() + ten_mk.e() + DiyFp::kSignificandSize) && (kMaximalTargetExponent >= w.e() + ten_mk.e() + DiyFp::kSignificandSize)); // Note that ten_mk is only an approximation of 10^-k. A DiyFp only contains a // 64 bit significand and ten_mk is thus only precise up to 64 bits. // The DiyFp::Times procedure rounds its result, and ten_mk is approximated // too. The variable scaled_w (as well as scaled_boundary_minus/plus) are now // off by a small amount. // In fact: scaled_w - w*10^k < 1ulp (unit in the last place) of scaled_w. // In other words: let f = scaled_w.f() and e = scaled_w.e(), then // (f-1) * 2^e < w*10^k < (f+1) * 2^e DiyFp scaled_w = DiyFp::Times(w, ten_mk); // We now have (double) (scaled_w * 10^-mk). // DigitGen will generate the first requested_digits digits of scaled_w and // return together with a kappa such that scaled_w ~= buffer * 10^kappa. (It // will not always be exactly the same since DigitGenCounted only produces a // limited number of digits.) 
int kappa; bool result = DigitGenCounted(scaled_w, requested_digits, buffer, length, &kappa); *decimal_exponent = -mk + kappa; return result; } bool FastDtoa(double v, FastDtoaMode mode, int requested_digits, Vector buffer, int* length, int* decimal_point) { ASSERT(v > 0); ASSERT(!Double(v).IsSpecial()); bool result = false; int decimal_exponent = 0; switch (mode) { case FAST_DTOA_SHORTEST: case FAST_DTOA_SHORTEST_SINGLE: result = Grisu3(v, mode, buffer, length, &decimal_exponent); break; case FAST_DTOA_PRECISION: result = Grisu3Counted(v, requested_digits, buffer, length, &decimal_exponent); break; default: UNREACHABLE(); } if (result) { *decimal_point = *length + decimal_exponent; buffer[*length] = '\0'; } return result; } } // namespace double_conversion ================================================ FILE: src/kenlm/util/double-conversion/fast-dtoa.h ================================================ // Copyright 2010 the V8 project authors. All rights reserved. // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following // disclaimer in the documentation and/or other materials provided // with the distribution. // * Neither the name of Google Inc. nor the names of its // contributors may be used to endorse or promote products derived // from this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #ifndef DOUBLE_CONVERSION_FAST_DTOA_H_ #define DOUBLE_CONVERSION_FAST_DTOA_H_ #include "utils.h" namespace double_conversion { enum FastDtoaMode { // Computes the shortest representation of the given input. The returned // result will be the most accurate number of this length. Longer // representations might be more accurate. FAST_DTOA_SHORTEST, // Same as FAST_DTOA_SHORTEST but for single-precision floats. FAST_DTOA_SHORTEST_SINGLE, // Computes a representation where the precision (number of digits) is // given as input. The precision is independent of the decimal point. FAST_DTOA_PRECISION }; // FastDtoa will produce at most kFastDtoaMaximalLength digits. This does not // include the terminating '\0' character. static const int kFastDtoaMaximalLength = 17; // Same for single-precision numbers. static const int kFastDtoaMaximalSingleLength = 9; // Provides a decimal representation of v. // The result should be interpreted as buffer * 10^(point - length). // // Precondition: // * v must be a strictly positive finite double. 
// // Returns true if it succeeds, otherwise the result can not be trusted. // There will be *length digits inside the buffer followed by a null terminator. // If the function returns true and mode equals // - FAST_DTOA_SHORTEST, then // the parameter requested_digits is ignored. // The result satisfies // v == (double) (buffer * 10^(point - length)). // The digits in the buffer are the shortest representation possible. E.g. // if 0.099999999999 and 0.1 represent the same double then "1" is returned // with point = 0. // The last digit will be closest to the actual v. That is, even if several // digits might correctly yield 'v' when read again, the buffer will contain // the one closest to v. // - FAST_DTOA_PRECISION, then // the buffer contains requested_digits digits. // the difference v - (buffer * 10^(point-length)) is closest to zero for // all possible representations of requested_digits digits. // If there are two values that are equally close, then FastDtoa returns // false. // For both modes the buffer must be large enough to hold the result. bool FastDtoa(double d, FastDtoaMode mode, int requested_digits, Vector buffer, int* length, int* decimal_point); } // namespace double_conversion #endif // DOUBLE_CONVERSION_FAST_DTOA_H_ ================================================ FILE: src/kenlm/util/double-conversion/fixed-dtoa.cc ================================================ // Copyright 2010 the V8 project authors. All rights reserved. // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following // disclaimer in the documentation and/or other materials provided // with the distribution. // * Neither the name of Google Inc. nor the names of its // contributors may be used to endorse or promote products derived // from this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #include #include "fixed-dtoa.h" #include "ieee.h" namespace double_conversion { // Represents a 128bit type. This class should be replaced by a native type on // platforms that support 128bit integers. 
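// Illustrative example (not part of the original source): the value is stored
// as high_bits_ * 2^64 + low_bits_, so 2^64 + 3 has high_bits_ == 1 and
// low_bits_ == 3, and Multiply(5) turns it into high_bits_ == 5,
// low_bits_ == 15, i.e. 5 * (2^64 + 3).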
class UInt128 { public: UInt128() : high_bits_(0), low_bits_(0) { } UInt128(uint64_t high, uint64_t low) : high_bits_(high), low_bits_(low) { } void Multiply(uint32_t multiplicand) { uint64_t accumulator; accumulator = (low_bits_ & kMask32) * multiplicand; uint32_t part = static_cast(accumulator & kMask32); accumulator >>= 32; accumulator = accumulator + (low_bits_ >> 32) * multiplicand; low_bits_ = (accumulator << 32) + part; accumulator >>= 32; accumulator = accumulator + (high_bits_ & kMask32) * multiplicand; part = static_cast(accumulator & kMask32); accumulator >>= 32; accumulator = accumulator + (high_bits_ >> 32) * multiplicand; high_bits_ = (accumulator << 32) + part; ASSERT((accumulator >> 32) == 0); } void Shift(int shift_amount) { ASSERT(-64 <= shift_amount && shift_amount <= 64); if (shift_amount == 0) { return; } else if (shift_amount == -64) { high_bits_ = low_bits_; low_bits_ = 0; } else if (shift_amount == 64) { low_bits_ = high_bits_; high_bits_ = 0; } else if (shift_amount <= 0) { high_bits_ <<= -shift_amount; high_bits_ += low_bits_ >> (64 + shift_amount); low_bits_ <<= -shift_amount; } else { low_bits_ >>= shift_amount; low_bits_ += high_bits_ << (64 - shift_amount); high_bits_ >>= shift_amount; } } // Modifies *this to *this MOD (2^power). // Returns *this DIV (2^power). int DivModPowerOf2(int power) { if (power >= 64) { int result = static_cast(high_bits_ >> (power - 64)); high_bits_ -= static_cast(result) << (power - 64); return result; } else { uint64_t part_low = low_bits_ >> power; uint64_t part_high = high_bits_ << (64 - power); int result = static_cast(part_low + part_high); high_bits_ = 0; low_bits_ -= part_low << power; return result; } } bool IsZero() const { return high_bits_ == 0 && low_bits_ == 0; } int BitAt(int position) { if (position >= 64) { return static_cast(high_bits_ >> (position - 64)) & 1; } else { return static_cast(low_bits_ >> position) & 1; } } private: static const uint64_t kMask32 = 0xFFFFFFFF; // Value == (high_bits_ << 64) + low_bits_ uint64_t high_bits_; uint64_t low_bits_; }; static const int kDoubleSignificandSize = 53; // Includes the hidden bit. static void FillDigits32FixedLength(uint32_t number, int requested_length, Vector buffer, int* length) { for (int i = requested_length - 1; i >= 0; --i) { buffer[(*length) + i] = '0' + number % 10; number /= 10; } *length += requested_length; } static void FillDigits32(uint32_t number, Vector buffer, int* length) { int number_length = 0; // We fill the digits in reverse order and exchange them afterwards. while (number != 0) { int digit = number % 10; number /= 10; buffer[(*length) + number_length] = '0' + digit; number_length++; } // Exchange the digits. int i = *length; int j = *length + number_length - 1; while (i < j) { char tmp = buffer[i]; buffer[i] = buffer[j]; buffer[j] = tmp; i++; j--; } *length += number_length; } static void FillDigits64FixedLength(uint64_t number, int requested_length, Vector buffer, int* length) { const uint32_t kTen7 = 10000000; // For efficiency cut the number into 3 uint32_t parts, and print those. 
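// Illustrative example (not part of the original source): for
// number == 12345678901234567 the split below gives part0 == 123,
// part1 == 4567890 and part2 == 1234567, so the three fixed-length prints
// reproduce the original 17 digits in order.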
uint32_t part2 = static_cast(number % kTen7); number /= kTen7; uint32_t part1 = static_cast(number % kTen7); uint32_t part0 = static_cast(number / kTen7); FillDigits32FixedLength(part0, 3, buffer, length); FillDigits32FixedLength(part1, 7, buffer, length); FillDigits32FixedLength(part2, 7, buffer, length); } static void FillDigits64(uint64_t number, Vector buffer, int* length) { const uint32_t kTen7 = 10000000; // For efficiency cut the number into 3 uint32_t parts, and print those. uint32_t part2 = static_cast(number % kTen7); number /= kTen7; uint32_t part1 = static_cast(number % kTen7); uint32_t part0 = static_cast(number / kTen7); if (part0 != 0) { FillDigits32(part0, buffer, length); FillDigits32FixedLength(part1, 7, buffer, length); FillDigits32FixedLength(part2, 7, buffer, length); } else if (part1 != 0) { FillDigits32(part1, buffer, length); FillDigits32FixedLength(part2, 7, buffer, length); } else { FillDigits32(part2, buffer, length); } } static void RoundUp(Vector buffer, int* length, int* decimal_point) { // An empty buffer represents 0. if (*length == 0) { buffer[0] = '1'; *decimal_point = 1; *length = 1; return; } // Round the last digit until we either have a digit that was not '9' or until // we reached the first digit. buffer[(*length) - 1]++; for (int i = (*length) - 1; i > 0; --i) { if (buffer[i] != '0' + 10) { return; } buffer[i] = '0'; buffer[i - 1]++; } // If the first digit is now '0' + 10, we would need to set it to '0' and add // a '1' in front. However we reach the first digit only if all following // digits had been '9' before rounding up. Now all trailing digits are '0' and // we simply switch the first digit to '1' and update the decimal-point // (indicating that the point is now one digit to the right). if (buffer[0] == '0' + 10) { buffer[0] = '1'; (*decimal_point)++; } } // The given fractionals number represents a fixed-point number with binary // point at bit (-exponent). // Preconditions: // -128 <= exponent <= 0. // 0 <= fractionals * 2^exponent < 1 // The buffer holds the result. // The function will round its result. During the rounding-process digits not // generated by this function might be updated, and the decimal-point variable // might be updated. If this function generates the digits 99 and the buffer // already contained "199" (thus yielding a buffer of "19999") then a // rounding-up will change the contents of the buffer to "20000". static void FillFractionals(uint64_t fractionals, int exponent, int fractional_count, Vector buffer, int* length, int* decimal_point) { ASSERT(-128 <= exponent && exponent <= 0); // 'fractionals' is a fixed-point number, with binary point at bit // (-exponent). Inside the function the non-converted remainder of fractionals // is a fixed-point number, with binary point at bit 'point'. if (-exponent <= 64) { // One 64 bit number is sufficient. ASSERT(fractionals >> 56 == 0); int point = -exponent; for (int i = 0; i < fractional_count; ++i) { if (fractionals == 0) break; // Instead of multiplying by 10 we multiply by 5 and adjust the point // location. This way the fractionals variable will not overflow. // Invariant at the beginning of the loop: fractionals < 2^point. // Initially we have: point <= 64 and fractionals < 2^56 // After each iteration the point is decremented by one. // Note that 5^3 = 125 < 128 = 2^7. // Therefore three iterations of this loop will not overflow fractionals // (even without the subtraction at the end of the loop body). 
At this // time point will satisfy point <= 61 and therefore fractionals < 2^point // and any further multiplication of fractionals by 5 will not overflow. fractionals *= 5; point--; int digit = static_cast(fractionals >> point); buffer[*length] = '0' + digit; (*length)++; fractionals -= static_cast(digit) << point; } // If the first bit after the point is set we have to round up. if (((fractionals >> (point - 1)) & 1) == 1) { RoundUp(buffer, length, decimal_point); } } else { // We need 128 bits. ASSERT(64 < -exponent && -exponent <= 128); UInt128 fractionals128 = UInt128(fractionals, 0); fractionals128.Shift(-exponent - 64); int point = 128; for (int i = 0; i < fractional_count; ++i) { if (fractionals128.IsZero()) break; // As before: instead of multiplying by 10 we multiply by 5 and adjust the // point location. // This multiplication will not overflow for the same reasons as before. fractionals128.Multiply(5); point--; int digit = fractionals128.DivModPowerOf2(point); buffer[*length] = '0' + digit; (*length)++; } if (fractionals128.BitAt(point - 1) == 1) { RoundUp(buffer, length, decimal_point); } } } // Removes leading and trailing zeros. // If leading zeros are removed then the decimal point position is adjusted. static void TrimZeros(Vector buffer, int* length, int* decimal_point) { while (*length > 0 && buffer[(*length) - 1] == '0') { (*length)--; } int first_non_zero = 0; while (first_non_zero < *length && buffer[first_non_zero] == '0') { first_non_zero++; } if (first_non_zero != 0) { for (int i = first_non_zero; i < *length; ++i) { buffer[i - first_non_zero] = buffer[i]; } *length -= first_non_zero; *decimal_point -= first_non_zero; } } bool FastFixedDtoa(double v, int fractional_count, Vector buffer, int* length, int* decimal_point) { const uint32_t kMaxUInt32 = 0xFFFFFFFF; uint64_t significand = Double(v).Significand(); int exponent = Double(v).Exponent(); // v = significand * 2^exponent (with significand a 53bit integer). // If the exponent is larger than 20 (i.e. we may have a 73bit number) then we // don't know how to compute the representation. 2^73 ~= 9.5*10^21. // If necessary this limit could probably be increased, but we don't need // more. if (exponent > 20) return false; if (fractional_count > 20) return false; *length = 0; // At most kDoubleSignificandSize bits of the significand are non-zero. // Given a 64 bit integer we have 11 0s followed by 53 potentially non-zero // bits: 0..11*..0xxx..53*..xx if (exponent + kDoubleSignificandSize > 64) { // The exponent must be > 11. // // We know that v = significand * 2^exponent. // And the exponent > 11. // We simplify the task by dividing v by 10^17. // The quotient delivers the first digits, and the remainder fits into a 64 // bit number. // Dividing by 10^17 is equivalent to dividing by 5^17*2^17. const uint64_t kFive17 = UINT64_2PART_C(0xB1, A2BC2EC5); // 5^17 uint64_t divisor = kFive17; int divisor_power = 17; uint64_t dividend = significand; uint32_t quotient; uint64_t remainder; // Let v = f * 2^e with f == significand and e == exponent. 
// Then need q (quotient) and r (remainder) as follows: // v = q * 10^17 + r // f * 2^e = q * 10^17 + r // f * 2^e = q * 5^17 * 2^17 + r // If e > 17 then // f * 2^(e-17) = q * 5^17 + r/2^17 // else // f = q * 5^17 * 2^(17-e) + r/2^e if (exponent > divisor_power) { // We only allow exponents of up to 20 and therefore (17 - e) <= 3 dividend <<= exponent - divisor_power; quotient = static_cast(dividend / divisor); remainder = (dividend % divisor) << divisor_power; } else { divisor <<= divisor_power - exponent; quotient = static_cast(dividend / divisor); remainder = (dividend % divisor) << exponent; } FillDigits32(quotient, buffer, length); FillDigits64FixedLength(remainder, divisor_power, buffer, length); *decimal_point = *length; } else if (exponent >= 0) { // 0 <= exponent <= 11 significand <<= exponent; FillDigits64(significand, buffer, length); *decimal_point = *length; } else if (exponent > -kDoubleSignificandSize) { // We have to cut the number. uint64_t integrals = significand >> -exponent; uint64_t fractionals = significand - (integrals << -exponent); if (integrals > kMaxUInt32) { FillDigits64(integrals, buffer, length); } else { FillDigits32(static_cast(integrals), buffer, length); } *decimal_point = *length; FillFractionals(fractionals, exponent, fractional_count, buffer, length, decimal_point); } else if (exponent < -128) { // This configuration (with at most 20 digits) means that all digits must be // 0. ASSERT(fractional_count <= 20); buffer[0] = '\0'; *length = 0; *decimal_point = -fractional_count; } else { *decimal_point = 0; FillFractionals(significand, exponent, fractional_count, buffer, length, decimal_point); } TrimZeros(buffer, length, decimal_point); buffer[*length] = '\0'; if ((*length) == 0) { // The string is empty and the decimal_point thus has no importance. Mimick // Gay's dtoa and and set it to -fractional_count. *decimal_point = -fractional_count; } return true; } } // namespace double_conversion ================================================ FILE: src/kenlm/util/double-conversion/fixed-dtoa.h ================================================ // Copyright 2010 the V8 project authors. All rights reserved. // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following // disclaimer in the documentation and/or other materials provided // with the distribution. // * Neither the name of Google Inc. nor the names of its // contributors may be used to endorse or promote products derived // from this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. 
IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #ifndef DOUBLE_CONVERSION_FIXED_DTOA_H_ #define DOUBLE_CONVERSION_FIXED_DTOA_H_ #include "utils.h" namespace double_conversion { // Produces digits necessary to print a given number with // 'fractional_count' digits after the decimal point. // The buffer must be big enough to hold the result plus one terminating null // character. // // The produced digits might be too short in which case the caller has to fill // the gaps with '0's. // Example: FastFixedDtoa(0.001, 5, ...) is allowed to return buffer = "1", and // decimal_point = -2. // Halfway cases are rounded towards +/-Infinity (away from 0). The call // FastFixedDtoa(0.15, 2, ...) thus returns buffer = "2", decimal_point = 0. // The returned buffer may contain digits that would be truncated from the // shortest representation of the input. // // This method only works for some parameters. If it can't handle the input it // returns false. The output is null-terminated when the function succeeds. bool FastFixedDtoa(double v, int fractional_count, Vector buffer, int* length, int* decimal_point); } // namespace double_conversion #endif // DOUBLE_CONVERSION_FIXED_DTOA_H_ ================================================ FILE: src/kenlm/util/double-conversion/ieee.h ================================================ // Copyright 2012 the V8 project authors. All rights reserved. // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following // disclaimer in the documentation and/or other materials provided // with the distribution. // * Neither the name of Google Inc. nor the names of its // contributors may be used to endorse or promote products derived // from this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #ifndef DOUBLE_CONVERSION_DOUBLE_H_ #define DOUBLE_CONVERSION_DOUBLE_H_ #include "diy-fp.h" namespace double_conversion { // We assume that doubles and uint64_t have the same endianness. 
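// Worked example (for illustration only; nothing below depends on it) of the
// bit layout that the Double class in this header decodes: for a normal
// binary64 value with bit pattern b,
//   biased exponent = (b & kExponentMask) >> 52
//   Exponent()      = biased exponent - 1075        (kExponentBias = 0x3FF + 52)
//   Significand()   = (b & kSignificandMask) + 2^52 (hidden bit added back)
// and the value equals Significand() * 2^Exponent(). For instance, 1.0 has
// b = 0x3FF0000000000000, so Significand() = 2^52, Exponent() = -52, and
// 2^52 * 2^-52 = 1.0.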
static uint64_t double_to_uint64(double d) { return BitCast(d); } static double uint64_to_double(uint64_t d64) { return BitCast(d64); } static uint32_t float_to_uint32(float f) { return BitCast(f); } static float uint32_to_float(uint32_t d32) { return BitCast(d32); } // Helper functions for doubles. class Double { public: static const uint64_t kSignMask = UINT64_2PART_C(0x80000000, 00000000); static const uint64_t kExponentMask = UINT64_2PART_C(0x7FF00000, 00000000); static const uint64_t kSignificandMask = UINT64_2PART_C(0x000FFFFF, FFFFFFFF); static const uint64_t kHiddenBit = UINT64_2PART_C(0x00100000, 00000000); static const int kPhysicalSignificandSize = 52; // Excludes the hidden bit. static const int kSignificandSize = 53; Double() : d64_(0) {} explicit Double(double d) : d64_(double_to_uint64(d)) {} explicit Double(uint64_t d64) : d64_(d64) {} explicit Double(DiyFp diy_fp) : d64_(DiyFpToUint64(diy_fp)) {} // The value encoded by this Double must be greater or equal to +0.0. // It must not be special (infinity, or NaN). DiyFp AsDiyFp() const { ASSERT(Sign() > 0); ASSERT(!IsSpecial()); return DiyFp(Significand(), Exponent()); } // The value encoded by this Double must be strictly greater than 0. DiyFp AsNormalizedDiyFp() const { ASSERT(value() > 0.0); uint64_t f = Significand(); int e = Exponent(); // The current double could be a denormal. while ((f & kHiddenBit) == 0) { f <<= 1; e--; } // Do the final shifts in one go. f <<= DiyFp::kSignificandSize - kSignificandSize; e -= DiyFp::kSignificandSize - kSignificandSize; return DiyFp(f, e); } // Returns the double's bit as uint64. uint64_t AsUint64() const { return d64_; } // Returns the next greater double. Returns +infinity on input +infinity. double NextDouble() const { if (d64_ == kInfinity) return Double(kInfinity).value(); if (Sign() < 0 && Significand() == 0) { // -0.0 return 0.0; } if (Sign() < 0) { return Double(d64_ - 1).value(); } else { return Double(d64_ + 1).value(); } } double PreviousDouble() const { if (d64_ == (kInfinity | kSignMask)) return -Double::Infinity(); if (Sign() < 0) { return Double(d64_ + 1).value(); } else { if (Significand() == 0) return -0.0; return Double(d64_ - 1).value(); } } int Exponent() const { if (IsDenormal()) return kDenormalExponent; uint64_t d64 = AsUint64(); int biased_e = static_cast((d64 & kExponentMask) >> kPhysicalSignificandSize); return biased_e - kExponentBias; } uint64_t Significand() const { uint64_t d64 = AsUint64(); uint64_t significand = d64 & kSignificandMask; if (!IsDenormal()) { return significand + kHiddenBit; } else { return significand; } } // Returns true if the double is a denormal. bool IsDenormal() const { uint64_t d64 = AsUint64(); return (d64 & kExponentMask) == 0; } // We consider denormals not to be special. // Hence only Infinity and NaN are special. bool IsSpecial() const { uint64_t d64 = AsUint64(); return (d64 & kExponentMask) == kExponentMask; } bool IsNan() const { uint64_t d64 = AsUint64(); return ((d64 & kExponentMask) == kExponentMask) && ((d64 & kSignificandMask) != 0); } bool IsInfinite() const { uint64_t d64 = AsUint64(); return ((d64 & kExponentMask) == kExponentMask) && ((d64 & kSignificandMask) == 0); } int Sign() const { uint64_t d64 = AsUint64(); return (d64 & kSignMask) == 0? 1: -1; } // Precondition: the value encoded by this Double must be greater or equal // than +0.0. DiyFp UpperBoundary() const { ASSERT(Sign() > 0); return DiyFp(Significand() * 2 + 1, Exponent() - 1); } // Computes the two boundaries of this. 
// The bigger boundary (m_plus) is normalized. The lower boundary has the same // exponent as m_plus. // Precondition: the value encoded by this Double must be greater than 0. void NormalizedBoundaries(DiyFp* out_m_minus, DiyFp* out_m_plus) const { ASSERT(value() > 0.0); DiyFp v = this->AsDiyFp(); DiyFp m_plus = DiyFp::Normalize(DiyFp((v.f() << 1) + 1, v.e() - 1)); DiyFp m_minus; if (LowerBoundaryIsCloser()) { m_minus = DiyFp((v.f() << 2) - 1, v.e() - 2); } else { m_minus = DiyFp((v.f() << 1) - 1, v.e() - 1); } m_minus.set_f(m_minus.f() << (m_minus.e() - m_plus.e())); m_minus.set_e(m_plus.e()); *out_m_plus = m_plus; *out_m_minus = m_minus; } bool LowerBoundaryIsCloser() const { // The boundary is closer if the significand is of the form f == 2^p-1 then // the lower boundary is closer. // Think of v = 1000e10 and v- = 9999e9. // Then the boundary (== (v - v-)/2) is not just at a distance of 1e9 but // at a distance of 1e8. // The only exception is for the smallest normal: the largest denormal is // at the same distance as its successor. // Note: denormals have the same exponent as the smallest normals. bool physical_significand_is_zero = ((AsUint64() & kSignificandMask) == 0); return physical_significand_is_zero && (Exponent() != kDenormalExponent); } double value() const { return uint64_to_double(d64_); } // Returns the significand size for a given order of magnitude. // If v = f*2^e with 2^p-1 <= f <= 2^p then p+e is v's order of magnitude. // This function returns the number of significant binary digits v will have // once it's encoded into a double. In almost all cases this is equal to // kSignificandSize. The only exceptions are denormals. They start with // leading zeroes and their effective significand-size is hence smaller. static int SignificandSizeForOrderOfMagnitude(int order) { if (order >= (kDenormalExponent + kSignificandSize)) { return kSignificandSize; } if (order <= kDenormalExponent) return 0; return order - kDenormalExponent; } static double Infinity() { return Double(kInfinity).value(); } static double NaN() { return Double(kNaN).value(); } private: static const int kExponentBias = 0x3FF + kPhysicalSignificandSize; static const int kDenormalExponent = -kExponentBias + 1; static const int kMaxExponent = 0x7FF - kExponentBias; static const uint64_t kInfinity = UINT64_2PART_C(0x7FF00000, 00000000); static const uint64_t kNaN = UINT64_2PART_C(0x7FF80000, 00000000); const uint64_t d64_; static uint64_t DiyFpToUint64(DiyFp diy_fp) { uint64_t significand = diy_fp.f(); int exponent = diy_fp.e(); while (significand > kHiddenBit + kSignificandMask) { significand >>= 1; exponent++; } if (exponent >= kMaxExponent) { return kInfinity; } if (exponent < kDenormalExponent) { return 0; } while (exponent > kDenormalExponent && (significand & kHiddenBit) == 0) { significand <<= 1; exponent--; } uint64_t biased_exponent; if (exponent == kDenormalExponent && (significand & kHiddenBit) == 0) { biased_exponent = 0; } else { biased_exponent = static_cast(exponent + kExponentBias); } return (significand & kSignificandMask) | (biased_exponent << kPhysicalSignificandSize); } }; class Single { public: static const uint32_t kSignMask = 0x80000000; static const uint32_t kExponentMask = 0x7F800000; static const uint32_t kSignificandMask = 0x007FFFFF; static const uint32_t kHiddenBit = 0x00800000; static const int kPhysicalSignificandSize = 23; // Excludes the hidden bit. 
static const int kSignificandSize = 24; Single() : d32_(0) {} explicit Single(float f) : d32_(float_to_uint32(f)) {} explicit Single(uint32_t d32) : d32_(d32) {} // The value encoded by this Single must be greater or equal to +0.0. // It must not be special (infinity, or NaN). DiyFp AsDiyFp() const { ASSERT(Sign() > 0); ASSERT(!IsSpecial()); return DiyFp(Significand(), Exponent()); } // Returns the single's bit as uint64. uint32_t AsUint32() const { return d32_; } int Exponent() const { if (IsDenormal()) return kDenormalExponent; uint32_t d32 = AsUint32(); int biased_e = static_cast((d32 & kExponentMask) >> kPhysicalSignificandSize); return biased_e - kExponentBias; } uint32_t Significand() const { uint32_t d32 = AsUint32(); uint32_t significand = d32 & kSignificandMask; if (!IsDenormal()) { return significand + kHiddenBit; } else { return significand; } } // Returns true if the single is a denormal. bool IsDenormal() const { uint32_t d32 = AsUint32(); return (d32 & kExponentMask) == 0; } // We consider denormals not to be special. // Hence only Infinity and NaN are special. bool IsSpecial() const { uint32_t d32 = AsUint32(); return (d32 & kExponentMask) == kExponentMask; } bool IsNan() const { uint32_t d32 = AsUint32(); return ((d32 & kExponentMask) == kExponentMask) && ((d32 & kSignificandMask) != 0); } bool IsInfinite() const { uint32_t d32 = AsUint32(); return ((d32 & kExponentMask) == kExponentMask) && ((d32 & kSignificandMask) == 0); } int Sign() const { uint32_t d32 = AsUint32(); return (d32 & kSignMask) == 0? 1: -1; } // Computes the two boundaries of this. // The bigger boundary (m_plus) is normalized. The lower boundary has the same // exponent as m_plus. // Precondition: the value encoded by this Single must be greater than 0. void NormalizedBoundaries(DiyFp* out_m_minus, DiyFp* out_m_plus) const { ASSERT(value() > 0.0); DiyFp v = this->AsDiyFp(); DiyFp m_plus = DiyFp::Normalize(DiyFp((v.f() << 1) + 1, v.e() - 1)); DiyFp m_minus; if (LowerBoundaryIsCloser()) { m_minus = DiyFp((v.f() << 2) - 1, v.e() - 2); } else { m_minus = DiyFp((v.f() << 1) - 1, v.e() - 1); } m_minus.set_f(m_minus.f() << (m_minus.e() - m_plus.e())); m_minus.set_e(m_plus.e()); *out_m_plus = m_plus; *out_m_minus = m_minus; } // Precondition: the value encoded by this Single must be greater or equal // than +0.0. DiyFp UpperBoundary() const { ASSERT(Sign() > 0); return DiyFp(Significand() * 2 + 1, Exponent() - 1); } bool LowerBoundaryIsCloser() const { // The boundary is closer if the significand is of the form f == 2^p-1 then // the lower boundary is closer. // Think of v = 1000e10 and v- = 9999e9. // Then the boundary (== (v - v-)/2) is not just at a distance of 1e9 but // at a distance of 1e8. // The only exception is for the smallest normal: the largest denormal is // at the same distance as its successor. // Note: denormals have the same exponent as the smallest normals. 
bool physical_significand_is_zero = ((AsUint32() & kSignificandMask) == 0); return physical_significand_is_zero && (Exponent() != kDenormalExponent); } float value() const { return uint32_to_float(d32_); } static float Infinity() { return Single(kInfinity).value(); } static float NaN() { return Single(kNaN).value(); } private: static const int kExponentBias = 0x7F + kPhysicalSignificandSize; static const int kDenormalExponent = -kExponentBias + 1; static const int kMaxExponent = 0xFF - kExponentBias; static const uint32_t kInfinity = 0x7F800000; static const uint32_t kNaN = 0x7FC00000; const uint32_t d32_; }; } // namespace double_conversion #endif // DOUBLE_CONVERSION_DOUBLE_H_ ================================================ FILE: src/kenlm/util/double-conversion/strtod.cc ================================================ // Copyright 2010 the V8 project authors. All rights reserved. // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following // disclaimer in the documentation and/or other materials provided // with the distribution. // * Neither the name of Google Inc. nor the names of its // contributors may be used to endorse or promote products derived // from this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #include #include #include "strtod.h" #include "bignum.h" #include "cached-powers.h" #include "ieee.h" namespace double_conversion { // 2^53 = 9007199254740992. // Any integer with at most 15 decimal digits will hence fit into a double // (which has a 53bit significand) without loss of precision. static const int kMaxExactDoubleIntegerDecimalDigits = 15; // 2^64 = 18446744073709551616 > 10^19 static const int kMaxUint64DecimalDigits = 19; // Max double: 1.7976931348623157 x 10^308 // Min non-zero double: 4.9406564584124654 x 10^-324 // Any x >= 10^309 is interpreted as +infinity. // Any x <= 10^-324 is interpreted as 0. // Note that 2.5e-324 (despite being smaller than the min double) will be read // as non-zero (equal to the min non-zero double). 
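// For illustration (a sketch, not used by this file; it assumes a
// correctly-rounding C library strtod such as glibc's):
//   std::strtod("1e309", NULL)     // +infinity: above the max double ~1.8e308
//   std::strtod("2.5e-324", NULL)  // ~4.94e-324: rounds up to the min non-zero double
//   std::strtod("1e-325", NULL)    // 0.0: below half of the smallest denormal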
static const int kMaxDecimalPower = 309; static const int kMinDecimalPower = -324; // 2^64 = 18446744073709551616 static const uint64_t kMaxUint64 = UINT64_2PART_C(0xFFFFFFFF, FFFFFFFF); static const double exact_powers_of_ten[] = { 1.0, // 10^0 10.0, 100.0, 1000.0, 10000.0, 100000.0, 1000000.0, 10000000.0, 100000000.0, 1000000000.0, 10000000000.0, // 10^10 100000000000.0, 1000000000000.0, 10000000000000.0, 100000000000000.0, 1000000000000000.0, 10000000000000000.0, 100000000000000000.0, 1000000000000000000.0, 10000000000000000000.0, 100000000000000000000.0, // 10^20 1000000000000000000000.0, // 10^22 = 0x21e19e0c9bab2400000 = 0x878678326eac9 * 2^22 10000000000000000000000.0 }; static const int kExactPowersOfTenSize = ARRAY_SIZE(exact_powers_of_ten); // Maximum number of significant digits in the decimal representation. // In fact the value is 772 (see conversions.cc), but to give us some margin // we round up to 780. static const int kMaxSignificantDecimalDigits = 780; static Vector TrimLeadingZeros(Vector buffer) { for (int i = 0; i < buffer.length(); i++) { if (buffer[i] != '0') { return buffer.SubVector(i, buffer.length()); } } return Vector(buffer.start(), 0); } static Vector TrimTrailingZeros(Vector buffer) { for (int i = buffer.length() - 1; i >= 0; --i) { if (buffer[i] != '0') { return buffer.SubVector(0, i + 1); } } return Vector(buffer.start(), 0); } static void CutToMaxSignificantDigits(Vector buffer, int exponent, char* significant_buffer, int* significant_exponent) { for (int i = 0; i < kMaxSignificantDecimalDigits - 1; ++i) { significant_buffer[i] = buffer[i]; } // The input buffer has been trimmed. Therefore the last digit must be // different from '0'. ASSERT(buffer[buffer.length() - 1] != '0'); // Set the last digit to be non-zero. This is sufficient to guarantee // correct rounding. significant_buffer[kMaxSignificantDecimalDigits - 1] = '1'; *significant_exponent = exponent + (buffer.length() - kMaxSignificantDecimalDigits); } // Trims the buffer and cuts it to at most kMaxSignificantDecimalDigits. // If possible the input-buffer is reused, but if the buffer needs to be // modified (due to cutting), then the input needs to be copied into the // buffer_copy_space. static void TrimAndCut(Vector buffer, int exponent, char* buffer_copy_space, int space_size, Vector* trimmed, int* updated_exponent) { Vector left_trimmed = TrimLeadingZeros(buffer); Vector right_trimmed = TrimTrailingZeros(left_trimmed); exponent += left_trimmed.length() - right_trimmed.length(); if (right_trimmed.length() > kMaxSignificantDecimalDigits) { ASSERT(space_size >= kMaxSignificantDecimalDigits); CutToMaxSignificantDigits(right_trimmed, exponent, buffer_copy_space, updated_exponent); *trimmed = Vector(buffer_copy_space, kMaxSignificantDecimalDigits); } else { *trimmed = right_trimmed; *updated_exponent = exponent; } } // Reads digits from the buffer and converts them to a uint64. // Reads in as many digits as fit into a uint64. // When the string starts with "1844674407370955161" no further digit is read. // Since 2^64 = 18446744073709551616 it would still be possible read another // digit if it was less or equal than 6, but this would complicate the code. static uint64_t ReadUint64(Vector buffer, int* number_of_read_digits) { uint64_t result = 0; int i = 0; while (i < buffer.length() && result <= (kMaxUint64 / 10 - 1)) { int digit = buffer[i++] - '0'; ASSERT(0 <= digit && digit <= 9); result = 10 * result + digit; } *number_of_read_digits = i; return result; } // Reads a DiyFp from the buffer. 
// The returned DiyFp is not necessarily normalized. // If remaining_decimals is zero then the returned DiyFp is accurate. // Otherwise it has been rounded and has error of at most 1/2 ulp. static void ReadDiyFp(Vector buffer, DiyFp* result, int* remaining_decimals) { int read_digits; uint64_t significand = ReadUint64(buffer, &read_digits); if (buffer.length() == read_digits) { *result = DiyFp(significand, 0); *remaining_decimals = 0; } else { // Round the significand. if (buffer[read_digits] >= '5') { significand++; } // Compute the binary exponent. int exponent = 0; *result = DiyFp(significand, exponent); *remaining_decimals = buffer.length() - read_digits; } } static bool DoubleStrtod(Vector trimmed, int exponent, double* result) { #if !defined(DOUBLE_CONVERSION_CORRECT_DOUBLE_OPERATIONS) // On x86 the floating-point stack can be 64 or 80 bits wide. If it is // 80 bits wide (as is the case on Linux) then double-rounding occurs and the // result is not accurate. // We know that Windows32 uses 64 bits and is therefore accurate. // Note that the ARM simulator is compiled for 32bits. It therefore exhibits // the same problem. return false; #endif if (trimmed.length() <= kMaxExactDoubleIntegerDecimalDigits) { int read_digits; // The trimmed input fits into a double. // If the 10^exponent (resp. 10^-exponent) fits into a double too then we // can compute the result-double simply by multiplying (resp. dividing) the // two numbers. // This is possible because IEEE guarantees that floating-point operations // return the best possible approximation. if (exponent < 0 && -exponent < kExactPowersOfTenSize) { // 10^-exponent fits into a double. *result = static_cast(ReadUint64(trimmed, &read_digits)); ASSERT(read_digits == trimmed.length()); *result /= exact_powers_of_ten[-exponent]; return true; } if (0 <= exponent && exponent < kExactPowersOfTenSize) { // 10^exponent fits into a double. *result = static_cast(ReadUint64(trimmed, &read_digits)); ASSERT(read_digits == trimmed.length()); *result *= exact_powers_of_ten[exponent]; return true; } int remaining_digits = kMaxExactDoubleIntegerDecimalDigits - trimmed.length(); if ((0 <= exponent) && (exponent - remaining_digits < kExactPowersOfTenSize)) { // The trimmed string was short and we can multiply it with // 10^remaining_digits. As a result the remaining exponent now fits // into a double too. *result = static_cast(ReadUint64(trimmed, &read_digits)); ASSERT(read_digits == trimmed.length()); *result *= exact_powers_of_ten[remaining_digits]; *result *= exact_powers_of_ten[exponent - remaining_digits]; return true; } } return false; } // Returns 10^exponent as an exact DiyFp. // The given exponent must be in the range [1; kDecimalExponentDistance[. static DiyFp AdjustmentPowerOfTen(int exponent) { ASSERT(0 < exponent); ASSERT(exponent < PowersOfTenCache::kDecimalExponentDistance); // Simply hardcode the remaining powers for the given decimal exponent // distance. 
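// Worked check of two of the hardcoded entries below:
//   10^1 = 0xA000000000000000 * 2^-60, since 0xA000000000000000 = 10 * 2^60;
//   10^3 = 0xFA00000000000000 * 2^-54, since 0xFA = 250 and
//          250 * 2^56 * 2^-54 = 250 * 4 = 1000.
// Each significand has its top bit set, so the returned DiyFp is normalized.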
ASSERT(PowersOfTenCache::kDecimalExponentDistance == 8); switch (exponent) { case 1: return DiyFp(UINT64_2PART_C(0xa0000000, 00000000), -60); case 2: return DiyFp(UINT64_2PART_C(0xc8000000, 00000000), -57); case 3: return DiyFp(UINT64_2PART_C(0xfa000000, 00000000), -54); case 4: return DiyFp(UINT64_2PART_C(0x9c400000, 00000000), -50); case 5: return DiyFp(UINT64_2PART_C(0xc3500000, 00000000), -47); case 6: return DiyFp(UINT64_2PART_C(0xf4240000, 00000000), -44); case 7: return DiyFp(UINT64_2PART_C(0x98968000, 00000000), -40); default: UNREACHABLE(); return DiyFp(0, 0); } } // If the function returns true then the result is the correct double. // Otherwise it is either the correct double or the double that is just below // the correct double. static bool DiyFpStrtod(Vector buffer, int exponent, double* result) { DiyFp input; int remaining_decimals; ReadDiyFp(buffer, &input, &remaining_decimals); // Since we may have dropped some digits the input is not accurate. // If remaining_decimals is different than 0 than the error is at most // .5 ulp (unit in the last place). // We don't want to deal with fractions and therefore keep a common // denominator. const int kDenominatorLog = 3; const int kDenominator = 1 << kDenominatorLog; // Move the remaining decimals into the exponent. exponent += remaining_decimals; int error = (remaining_decimals == 0 ? 0 : kDenominator / 2); int old_e = input.e(); input.Normalize(); error <<= old_e - input.e(); ASSERT(exponent <= PowersOfTenCache::kMaxDecimalExponent); if (exponent < PowersOfTenCache::kMinDecimalExponent) { *result = 0.0; return true; } DiyFp cached_power; int cached_decimal_exponent; PowersOfTenCache::GetCachedPowerForDecimalExponent(exponent, &cached_power, &cached_decimal_exponent); if (cached_decimal_exponent != exponent) { int adjustment_exponent = exponent - cached_decimal_exponent; DiyFp adjustment_power = AdjustmentPowerOfTen(adjustment_exponent); input.Multiply(adjustment_power); if (kMaxUint64DecimalDigits - buffer.length() >= adjustment_exponent) { // The product of input with the adjustment power fits into a 64 bit // integer. ASSERT(DiyFp::kSignificandSize == 64); } else { // The adjustment power is exact. There is hence only an error of 0.5. error += kDenominator / 2; } } input.Multiply(cached_power); // The error introduced by a multiplication of a*b equals // error_a + error_b + error_a*error_b/2^64 + 0.5 // Substituting a with 'input' and b with 'cached_power' we have // error_b = 0.5 (all cached powers have an error of less than 0.5 ulp), // error_ab = 0 or 1 / kDenominator > error_a*error_b/ 2^64 int error_b = kDenominator / 2; int error_ab = (error == 0 ? 0 : 1); // We round up to 1. int fixed_error = kDenominator / 2; error += error_b + error_ab + fixed_error; old_e = input.e(); input.Normalize(); error <<= old_e - input.e(); // See if the double's significand changes if we add/subtract the error. int order_of_magnitude = DiyFp::kSignificandSize + input.e(); int effective_significand_size = Double::SignificandSizeForOrderOfMagnitude(order_of_magnitude); int precision_digits_count = DiyFp::kSignificandSize - effective_significand_size; if (precision_digits_count + kDenominatorLog >= DiyFp::kSignificandSize) { // This can only happen for very small denormals. In this case the // half-way multiplied by the denominator exceeds the range of an uint64. // Simply shift everything to the right. 
int shift_amount = (precision_digits_count + kDenominatorLog) - DiyFp::kSignificandSize + 1; input.set_f(input.f() >> shift_amount); input.set_e(input.e() + shift_amount); // We add 1 for the lost precision of error, and kDenominator for // the lost precision of input.f(). error = (error >> shift_amount) + 1 + kDenominator; precision_digits_count -= shift_amount; } // We use uint64_ts now. This only works if the DiyFp uses uint64_ts too. ASSERT(DiyFp::kSignificandSize == 64); ASSERT(precision_digits_count < 64); uint64_t one64 = 1; uint64_t precision_bits_mask = (one64 << precision_digits_count) - 1; uint64_t precision_bits = input.f() & precision_bits_mask; uint64_t half_way = one64 << (precision_digits_count - 1); precision_bits *= kDenominator; half_way *= kDenominator; DiyFp rounded_input(input.f() >> precision_digits_count, input.e() + precision_digits_count); if (precision_bits >= half_way + error) { rounded_input.set_f(rounded_input.f() + 1); } // If the last_bits are too close to the half-way case than we are too // inaccurate and round down. In this case we return false so that we can // fall back to a more precise algorithm. *result = Double(rounded_input).value(); if (half_way - error < precision_bits && precision_bits < half_way + error) { // Too imprecise. The caller will have to fall back to a slower version. // However the returned number is guaranteed to be either the correct // double, or the next-lower double. return false; } else { return true; } } // Returns // - -1 if buffer*10^exponent < diy_fp. // - 0 if buffer*10^exponent == diy_fp. // - +1 if buffer*10^exponent > diy_fp. // Preconditions: // buffer.length() + exponent <= kMaxDecimalPower + 1 // buffer.length() + exponent > kMinDecimalPower // buffer.length() <= kMaxDecimalSignificantDigits static int CompareBufferWithDiyFp(Vector buffer, int exponent, DiyFp diy_fp) { ASSERT(buffer.length() + exponent <= kMaxDecimalPower + 1); ASSERT(buffer.length() + exponent > kMinDecimalPower); ASSERT(buffer.length() <= kMaxSignificantDecimalDigits); // Make sure that the Bignum will be able to hold all our numbers. // Our Bignum implementation has a separate field for exponents. Shifts will // consume at most one bigit (< 64 bits). // ln(10) == 3.3219... ASSERT(((kMaxDecimalPower + 1) * 333 / 100) < Bignum::kMaxSignificantBits); Bignum buffer_bignum; Bignum diy_fp_bignum; buffer_bignum.AssignDecimalString(buffer); diy_fp_bignum.AssignUInt64(diy_fp.f()); if (exponent >= 0) { buffer_bignum.MultiplyByPowerOfTen(exponent); } else { diy_fp_bignum.MultiplyByPowerOfTen(-exponent); } if (diy_fp.e() > 0) { diy_fp_bignum.ShiftLeft(diy_fp.e()); } else { buffer_bignum.ShiftLeft(-diy_fp.e()); } return Bignum::Compare(buffer_bignum, diy_fp_bignum); } // Returns true if the guess is the correct double. // Returns false, when guess is either correct or the next-lower double. 
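// (For orientation: ComputeGuess first handles obvious over- and underflow,
// then tries DoubleStrtod, which is exact whenever both the digits and the
// power of ten fit into doubles (for example, buffer "5" with exponent -1
// becomes 5.0 / 10.0 and yields 0.5 exactly), and otherwise falls back to
// DiyFpStrtod. When neither can certify the result, Strtod below settles the
// remaining doubt with an exact Bignum comparison against the boundary
// between the guess and the next double.)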
static bool ComputeGuess(Vector trimmed, int exponent, double* guess) { if (trimmed.length() == 0) { *guess = 0.0; return true; } if (exponent + trimmed.length() - 1 >= kMaxDecimalPower) { *guess = Double::Infinity(); return true; } if (exponent + trimmed.length() <= kMinDecimalPower) { *guess = 0.0; return true; } if (DoubleStrtod(trimmed, exponent, guess) || DiyFpStrtod(trimmed, exponent, guess)) { return true; } if (*guess == Double::Infinity()) { return true; } return false; } double Strtod(Vector buffer, int exponent) { char copy_buffer[kMaxSignificantDecimalDigits]; Vector trimmed; int updated_exponent; TrimAndCut(buffer, exponent, copy_buffer, kMaxSignificantDecimalDigits, &trimmed, &updated_exponent); exponent = updated_exponent; double guess; bool is_correct = ComputeGuess(trimmed, exponent, &guess); if (is_correct) return guess; DiyFp upper_boundary = Double(guess).UpperBoundary(); int comparison = CompareBufferWithDiyFp(trimmed, exponent, upper_boundary); if (comparison < 0) { return guess; } else if (comparison > 0) { return Double(guess).NextDouble(); } else if ((Double(guess).Significand() & 1) == 0) { // Round towards even. return guess; } else { return Double(guess).NextDouble(); } } float Strtof(Vector buffer, int exponent) { char copy_buffer[kMaxSignificantDecimalDigits]; Vector trimmed; int updated_exponent; TrimAndCut(buffer, exponent, copy_buffer, kMaxSignificantDecimalDigits, &trimmed, &updated_exponent); exponent = updated_exponent; double double_guess; bool is_correct = ComputeGuess(trimmed, exponent, &double_guess); float float_guess = static_cast(double_guess); if (float_guess == double_guess) { // This shortcut triggers for integer values. return float_guess; } // We must catch double-rounding. Say the double has been rounded up, and is // now a boundary of a float, and rounds up again. This is why we have to // look at previous too. // Example (in decimal numbers): // input: 12349 // high-precision (4 digits): 1235 // low-precision (3 digits): // when read from input: 123 // when rounded from high precision: 124. // To do this we simply look at the neigbors of the correct result and see // if they would round to the same float. If the guess is not correct we have // to look at four values (since two different doubles could be the correct // double). double double_next = Double(double_guess).NextDouble(); double double_previous = Double(double_guess).PreviousDouble(); float f1 = static_cast(double_previous); #ifndef NDEBUG float f2 = float_guess; #endif float f3 = static_cast(double_next); float f4; if (is_correct) { f4 = f3; } else { double double_next2 = Double(double_next).NextDouble(); f4 = static_cast(double_next2); } #ifndef NDEBUG ASSERT(f1 <= f2 && f2 <= f3 && f3 <= f4); #endif // If the guess doesn't lie near a single-precision boundary we can simply // return its float-value. if (f1 == f4) { return float_guess; } ASSERT((f1 != f2 && f2 == f3 && f3 == f4) || (f1 == f2 && f2 != f3 && f3 == f4) || (f1 == f2 && f2 == f3 && f3 != f4)); // guess and next are the two possible canditates (in the same way that // double_guess was the lower candidate for a double-precision guess). 
float guess = f1; float next = f4; DiyFp upper_boundary; if (guess == 0.0f) { float min_float = 1e-45f; upper_boundary = Double(static_cast(min_float) / 2).AsDiyFp(); } else { upper_boundary = Single(guess).UpperBoundary(); } int comparison = CompareBufferWithDiyFp(trimmed, exponent, upper_boundary); if (comparison < 0) { return guess; } else if (comparison > 0) { return next; } else if ((Single(guess).Significand() & 1) == 0) { // Round towards even. return guess; } else { return next; } } } // namespace double_conversion ================================================ FILE: src/kenlm/util/double-conversion/strtod.h ================================================ // Copyright 2010 the V8 project authors. All rights reserved. // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following // disclaimer in the documentation and/or other materials provided // with the distribution. // * Neither the name of Google Inc. nor the names of its // contributors may be used to endorse or promote products derived // from this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #ifndef DOUBLE_CONVERSION_STRTOD_H_ #define DOUBLE_CONVERSION_STRTOD_H_ #include "utils.h" namespace double_conversion { // The buffer must only contain digits in the range [0-9]. It must not // contain a dot or a sign. It must not start with '0', and must not be empty. double Strtod(Vector buffer, int exponent); // The buffer must only contain digits in the range [0-9]. It must not // contain a dot or a sign. It must not start with '0', and must not be empty. float Strtof(Vector buffer, int exponent); } // namespace double_conversion #endif // DOUBLE_CONVERSION_STRTOD_H_ ================================================ FILE: src/kenlm/util/double-conversion/utils.h ================================================ // Copyright 2010 the V8 project authors. All rights reserved. // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following // disclaimer in the documentation and/or other materials provided // with the distribution. // * Neither the name of Google Inc. 
nor the names of its // contributors may be used to endorse or promote products derived // from this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #ifndef DOUBLE_CONVERSION_UTILS_H_ #define DOUBLE_CONVERSION_UTILS_H_ #include #include #include #ifndef ASSERT #define ASSERT(condition) (assert(condition)) #endif #ifndef UNIMPLEMENTED #define UNIMPLEMENTED() (abort()) #endif #ifndef UNREACHABLE #define UNREACHABLE() (abort()) #endif // Double operations detection based on target architecture. // Linux uses a 80bit wide floating point stack on x86. This induces double // rounding, which in turn leads to wrong results. // An easy way to test if the floating-point operations are correct is to // evaluate: 89255.0/1e22. If the floating-point stack is 64 bits wide then // the result is equal to 89255e-22. // The best way to test this, is to create a division-function and to compare // the output of the division with the expected result. (Inlining must be // disabled.) // On Linux,x86 89255e-22 != Div_double(89255.0/1e22) #if defined(_M_X64) || defined(__x86_64__) || \ defined(__ARMEL__) || defined(__avr32__) || \ defined(__hppa__) || defined(__ia64__) || \ defined(__mips__) || defined(__powerpc__) || \ defined(__sparc__) || defined(__sparc) || defined(__s390__) || \ defined(__SH4__) || defined(__alpha__) || \ defined(_MIPS_ARCH_MIPS32R2) #define DOUBLE_CONVERSION_CORRECT_DOUBLE_OPERATIONS 1 #elif defined(_M_IX86) || defined(__i386__) || defined(__i386) #if defined(_WIN32) // Windows uses a 64bit wide floating point stack. #define DOUBLE_CONVERSION_CORRECT_DOUBLE_OPERATIONS 1 #else #undef DOUBLE_CONVERSION_CORRECT_DOUBLE_OPERATIONS #endif // _WIN32 #else #error Target architecture was not detected as supported by Double-Conversion. #endif #if defined(_WIN32) && !defined(__MINGW32__) typedef signed char int8_t; typedef unsigned char uint8_t; typedef short int16_t; // NOLINT typedef unsigned short uint16_t; // NOLINT typedef int int32_t; typedef unsigned int uint32_t; typedef __int64 int64_t; typedef unsigned __int64 uint64_t; // intptr_t and friends are defined in crtdefs.h through stdio.h. #else #include #endif // The following macro works on both 32 and 64-bit platforms. // Usage: instead of writing 0x1234567890123456 // write UINT64_2PART_C(0x12345678,90123456); #define UINT64_2PART_C(a, b) (((static_cast(a) << 32) + 0x##b##u)) // The expression ARRAY_SIZE(a) is a compile-time constant of type // size_t which represents the number of elements of the given // array. You should only use ARRAY_SIZE on statically allocated // arrays. 
#ifndef ARRAY_SIZE #define ARRAY_SIZE(a) \ ((sizeof(a) / sizeof(*(a))) / \ static_cast(!(sizeof(a) % sizeof(*(a))))) #endif // A macro to disallow the evil copy constructor and operator= functions // This should be used in the private: declarations for a class #ifndef DISALLOW_COPY_AND_ASSIGN #define DISALLOW_COPY_AND_ASSIGN(TypeName) \ TypeName(const TypeName&); \ void operator=(const TypeName&) #endif // A macro to disallow all the implicit constructors, namely the // default constructor, copy constructor and operator= functions. // // This should be used in the private: declarations for a class // that wants to prevent anyone from instantiating it. This is // especially useful for classes containing only static methods. #ifndef DISALLOW_IMPLICIT_CONSTRUCTORS #define DISALLOW_IMPLICIT_CONSTRUCTORS(TypeName) \ TypeName(); \ DISALLOW_COPY_AND_ASSIGN(TypeName) #endif namespace double_conversion { static const int kCharSize = sizeof(char); // Returns the maximum of the two parameters. template static T Max(T a, T b) { return a < b ? b : a; } // Returns the minimum of the two parameters. template static T Min(T a, T b) { return a < b ? a : b; } inline int StrLength(const char* string) { size_t length = strlen(string); ASSERT(length == static_cast(static_cast(length))); return static_cast(length); } // This is a simplified version of V8's Vector class. template class Vector { public: Vector() : start_(NULL), length_(0) {} Vector(T* data, int length) : start_(data), length_(length) { ASSERT(length == 0 || (length > 0 && data != NULL)); } // Returns a vector using the same backing storage as this one, // spanning from and including 'from', to but not including 'to'. Vector SubVector(int from, int to) { ASSERT(to <= length_); ASSERT(from < to); ASSERT(0 <= from); return Vector(start() + from, to - from); } // Returns the length of the vector. int length() const { return length_; } // Returns whether or not the vector is empty. bool is_empty() const { return length_ == 0; } // Returns the pointer to the start of the data in the vector. T* start() const { return start_; } // Access individual vector elements - checks bounds in debug mode. T& operator[](int index) const { ASSERT(0 <= index && index < length_); return start_[index]; } T& first() { return start_[0]; } T& last() { return start_[length_ - 1]; } private: T* start_; int length_; }; // Helper class for building result strings in a character buffer. The // purpose of the class is to use safe operations that checks the // buffer bounds on all operations in debug mode. class StringBuilder { public: StringBuilder(char* buffer, int size) : buffer_(buffer, size), position_(0) { } ~StringBuilder() { if (!is_finalized()) Finalize(); } int size() const { return buffer_.length(); } // Get the current position in the builder. int position() const { ASSERT(!is_finalized()); return position_; } // Reset the position. void Reset() { position_ = 0; } // Add a single character to the builder. It is not allowed to add // 0-characters; use the Finalize() method to terminate the string // instead. void AddCharacter(char c) { ASSERT(c != '\0'); ASSERT(!is_finalized() && position_ < buffer_.length()); buffer_[position_++] = c; } // Add an entire string to the builder. Uses strlen() internally to // compute the length of the input string. void AddString(const char* s) { AddSubstring(s, StrLength(s)); } // Add the first 'n' characters of the given string 's' to the // builder. The input string must have enough characters. 
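// For example (illustrative only):
//   char buf[16];
//   StringBuilder builder(buf, sizeof(buf));
//   builder.AddString("ngram ");
//   builder.AddSubstring("1=42 tail", 4);  // copies just "1=42"
//   char* s = builder.Finalize();          // s == "ngram 1=42", 0-terminated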
void AddSubstring(const char* s, int n) { ASSERT(!is_finalized() && position_ + n < buffer_.length()); ASSERT(static_cast(n) <= strlen(s)); memmove(&buffer_[position_], s, n * kCharSize); position_ += n; } // Add character padding to the builder. If count is non-positive, // nothing is added to the builder. void AddPadding(char c, int count) { for (int i = 0; i < count; i++) { AddCharacter(c); } } // Finalize the string by 0-terminating it and returning the buffer. char* Finalize() { ASSERT(!is_finalized() && position_ < buffer_.length()); buffer_[position_] = '\0'; // Make sure nobody managed to add a 0-character to the // buffer while building the string. ASSERT(strlen(buffer_.start()) == static_cast(position_)); position_ = -1; ASSERT(is_finalized()); return buffer_.start(); } private: Vector buffer_; int position_; bool is_finalized() const { return position_ < 0; } DISALLOW_IMPLICIT_CONSTRUCTORS(StringBuilder); }; // The type-based aliasing rule allows the compiler to assume that pointers of // different types (for some definition of different) never alias each other. // Thus the following code does not work: // // float f = foo(); // int fbits = *(int*)(&f); // // The compiler 'knows' that the int pointer can't refer to f since the types // don't match, so the compiler may cache f in a register, leaving random data // in fbits. Using C++ style casts makes no difference, however a pointer to // char data is assumed to alias any other pointer. This is the 'memcpy // exception'. // // Bit_cast uses the memcpy exception to move the bits from a variable of one // type of a variable of another type. Of course the end result is likely to // be implementation dependent. Most compilers (gcc-4.2 and MSVC 2005) // will completely optimize BitCast away. // // There is an additional use for BitCast. // Recent gccs will warn when they see casts that may result in breakage due to // the type-based aliasing rule. If you have checked that there is no breakage // you can use BitCast to cast one pointer type to another. This confuses gcc // enough that it can no longer see that you have cast one pointer type to // another thus avoiding the warning. template inline Dest BitCast(const Source& source) { // Compile time assertion: sizeof(Dest) == sizeof(Source) // A compile error here means your Dest and Source have different sizes. typedef char VerifySizesAreEqual[sizeof(Dest) == sizeof(Source) ? 
1 : -1]; Dest dest; memmove(&dest, &source, sizeof(dest)); return dest; } template inline Dest BitCast(Source* source) { return BitCast(reinterpret_cast(source)); } } // namespace double_conversion #endif // DOUBLE_CONVERSION_UTILS_H_ ================================================ FILE: src/kenlm/util/ersatz_progress.cc ================================================ #include "util/ersatz_progress.hh" #include #include #include #include namespace util { namespace { const unsigned char kWidth = 100; } const char kProgressBanner[] = "----5---10---15---20---25---30---35---40---45---50---55---60---65---70---75---80---85---90---95--100\n"; ErsatzProgress::ErsatzProgress() : current_(0), next_(std::numeric_limits::max()), complete_(next_), out_(NULL) {} ErsatzProgress::~ErsatzProgress() { if (out_) Finished(); } ErsatzProgress::ErsatzProgress(uint64_t complete, std::ostream *to, const std::string &message) : current_(0), next_(complete / kWidth), complete_(complete), stones_written_(0), out_(to) { if (!out_) { next_ = std::numeric_limits::max(); return; } if (!message.empty()) *out_ << message << '\n'; *out_ << kProgressBanner; } void ErsatzProgress::Milestone() { if (!out_) { current_ = 0; return; } if (!complete_) return; unsigned char stone = std::min(static_cast(kWidth), (current_ * kWidth) / complete_); for (; stones_written_ < stone; ++stones_written_) { (*out_) << '*'; } if (stone == kWidth) { (*out_) << std::endl; next_ = std::numeric_limits::max(); out_ = NULL; } else { next_ = std::max(next_, ((stone + 1) * complete_ + kWidth - 1) / kWidth); } } } // namespace util ================================================ FILE: src/kenlm/util/ersatz_progress.hh ================================================ #ifndef UTIL_ERSATZ_PROGRESS__ #define UTIL_ERSATZ_PROGRESS__ #include #include #include // Ersatz version of boost::progress so core language model doesn't depend on // boost. Also adds option to print nothing. namespace util { extern const char kProgressBanner[]; class ErsatzProgress { public: // No output. ErsatzProgress(); // Null means no output. The null value is useful for passing along the ostream pointer from another caller. 
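// Illustrative use of the constructor below (total_lines is a hypothetical
// caller-side count):
//   util::ErsatzProgress progress(total_lines, &std::cerr, "Reading");
//   for (uint64_t i = 0; i < total_lines; ++i) { /* do work */ ++progress; }
// This prints the optional message and the 100-column banner once, then up to
// 100 '*' characters as the counter crosses each 1% milestone.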
explicit ErsatzProgress(uint64_t complete, std::ostream *to = &std::cerr, const std::string &message = ""); ~ErsatzProgress(); ErsatzProgress &operator++() { if (++current_ >= next_) Milestone(); return *this; } ErsatzProgress &operator+=(uint64_t amount) { if ((current_ += amount) >= next_) Milestone(); return *this; } void Set(uint64_t to) { if ((current_ = to) >= next_) Milestone(); } void Finished() { Set(complete_); } private: void Milestone(); uint64_t current_, next_, complete_; unsigned char stones_written_; std::ostream *out_; // noncopyable ErsatzProgress(const ErsatzProgress &other); ErsatzProgress &operator=(const ErsatzProgress &other); }; } // namespace util #endif // UTIL_ERSATZ_PROGRESS__ ================================================ FILE: src/kenlm/util/exception.cc ================================================ #include "util/exception.hh" #ifdef __GXX_RTTI #include #endif #include #include namespace util { Exception::Exception() throw() {} Exception::~Exception() throw() {} Exception::Exception(const Exception &from) : std::exception() { stream_ << from.stream_.str(); } Exception &Exception::operator=(const Exception &from) { stream_ << from.stream_.str(); return *this; } const char *Exception::what() const throw() { text_ = stream_.str(); return text_.c_str(); } void Exception::SetLocation(const char *file, unsigned int line, const char *func, const char *child_name, const char *condition) { /* The child class might have set some text, but we want this to come first. * Another option would be passing this information to the constructor, but * then child classes would have to accept constructor arguments and pass * them down. */ text_ = stream_.str(); stream_.str(""); stream_ << file << ':' << line; if (func) stream_ << " in " << func << " threw "; if (child_name) { stream_ << child_name; } else { #ifdef __GXX_RTTI stream_ << typeid(this).name(); #else stream_ << "an exception"; #endif } if (condition) stream_ << " because `" << condition; stream_ << "'.\n"; stream_ << text_; } namespace { // The XOPEN version. const char *HandleStrerror(int ret, const char *buf) { if (!ret) return buf; return NULL; } // The GNU version. const char *HandleStrerror(const char *ret, const char * /*buf*/) { return ret; } } // namespace ErrnoException::ErrnoException() throw() : errno_(errno) { char buf[200]; buf[0] = 0; #if defined(sun) || defined(_WIN32) || defined(_WIN64) const char *add = strerror(errno); #else const char *add = HandleStrerror(strerror_r(errno, buf, 200), buf); #endif if (add) { *this << add << ' '; } } ErrnoException::~ErrnoException() throw() {} OverflowException::OverflowException() throw() {} OverflowException::~OverflowException() throw() {} } // namespace util ================================================ FILE: src/kenlm/util/exception.hh ================================================ #ifndef UTIL_EXCEPTION__ #define UTIL_EXCEPTION__ #include #include #include #include #include namespace util { template typename Except::template ExceptionTag::Identity operator<<(Except &e, const Data &data); class Exception : public std::exception { public: Exception() throw(); virtual ~Exception() throw(); Exception(const Exception &from); Exception &operator=(const Exception &from); // Not threadsafe, but probably doesn't matter. FWIW, Boost's exception guidance implies that what() isn't threadsafe. const char *what() const throw(); // For use by the UTIL_THROW macros. 
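// Typical call sites look like the ones in util/file.cc further below, e.g.
//   UTIL_THROW_IF(-1 == (ret = open(name, O_RDONLY)), ErrnoException,
//                 "while opening " << name);
// which constructs the exception, calls SetLocation() with __FILE__,
// __LINE__, the function name and the stringified condition, streams the
// message into what(), and throws.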
void SetLocation( const char *file, unsigned int line, const char *func, const char *child_name, const char *condition); private: template friend typename Except::template ExceptionTag::Identity operator<<(Except &e, const Data &data); // This helps restrict operator<< defined below. template struct ExceptionTag { typedef T Identity; }; std::stringstream stream_; mutable std::string text_; }; /* This implements the normal operator<< for Exception and all its children. * SFINAE means it only applies to Exception. Think of this as an ersatz * boost::enable_if. */ template typename Except::template ExceptionTag::Identity operator<<(Except &e, const Data &data) { e.stream_ << data; return e; } #ifdef __GNUC__ #define UTIL_FUNC_NAME __PRETTY_FUNCTION__ #else #ifdef _WIN32 #define UTIL_FUNC_NAME __FUNCTION__ #else #define UTIL_FUNC_NAME NULL #endif #endif /* Create an instance of Exception, add the message Modify, and throw it. * Modify is appended to the what() message and can contain << for ostream * operations. * * do .. while kludge to swallow trailing ; character * http://gcc.gnu.org/onlinedocs/cpp/Swallowing-the-Semicolon.html . * Arg can be a constructor argument to the exception. */ #define UTIL_THROW_BACKEND(Condition, Exception, Arg, Modify) do { \ Exception UTIL_e Arg; \ UTIL_e.SetLocation(__FILE__, __LINE__, UTIL_FUNC_NAME, #Exception, Condition); \ UTIL_e << Modify; \ throw UTIL_e; \ } while (0) #define UTIL_THROW_ARG(Exception, Arg, Modify) \ UTIL_THROW_BACKEND(NULL, Exception, Arg, Modify) #define UTIL_THROW(Exception, Modify) \ UTIL_THROW_BACKEND(NULL, Exception, , Modify); #if __GNUC__ >= 3 #define UTIL_UNLIKELY(x) __builtin_expect (!!(x), 0) #else #define UTIL_UNLIKELY(x) (x) #endif #define UTIL_THROW_IF_ARG(Condition, Exception, Arg, Modify) do { \ if (UTIL_UNLIKELY(Condition)) { \ UTIL_THROW_BACKEND(#Condition, Exception, Arg, Modify); \ } \ } while (0) #define UTIL_THROW_IF(Condition, Exception, Modify) \ UTIL_THROW_IF_ARG(Condition, Exception, , Modify) // Exception that records errno and adds it to the message. class ErrnoException : public Exception { public: ErrnoException() throw(); virtual ~ErrnoException() throw(); int Error() const throw() { return errno_; } private: int errno_; }; // Utilities for overflow checking. class OverflowException : public Exception { public: OverflowException() throw(); ~OverflowException() throw(); }; template inline std::size_t CheckOverflowInternal(uint64_t value) { UTIL_THROW_IF(value > static_cast(std::numeric_limits::max()), OverflowException, "Integer overflow detected. This model is too big for 32-bit code."); return value; } template <> inline std::size_t CheckOverflowInternal<8>(uint64_t value) { return value; } inline std::size_t CheckOverflow(uint64_t value) { return CheckOverflowInternal(value); } } // namespace util #endif // UTIL_EXCEPTION__ ================================================ FILE: src/kenlm/util/fake_ofstream.hh ================================================ /* Like std::ofstream but without being incredibly slow. Backed by a raw fd. * Does not support many data types. Currently, it's targeted at writing ARPA * files quickly. */ #include "util/double-conversion/double-conversion.h" #include "util/double-conversion/utils.h" #include "util/file.hh" #include "util/scoped.hh" #include "util/string_piece.hh" #define BOOST_LEXICAL_CAST_ASSUME_C_LOCALE #include namespace util { class FakeOFStream { public: static const std::size_t kOutBuf = 1048576; // Does not take ownership of out. 
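// Illustrative use of the constructor below (writing to stdout, fd 1, so the
// descriptor is known to be valid):
//   util::FakeOFStream out(1);
//   out << StringPiece("ngram 1=") << 42u << '\n';
// Everything is buffered in the 1 MB StringBuilder and written with
// WriteOrThrow() on Flush() or at destruction; the caller retains ownership
// of the fd.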
explicit FakeOFStream(int out) : buf_(util::MallocOrThrow(kOutBuf)), builder_(static_cast(buf_.get()), kOutBuf), // Mostly the default but with inf instead. And no flags. convert_(double_conversion::DoubleToStringConverter::NO_FLAGS, "inf", "NaN", 'e', -6, 21, 6, 0), fd_(out) {} ~FakeOFStream() { Flush(); } FakeOFStream &operator<<(float value) { // Odd, but this is the largest number found in the comments. EnsureRemaining(double_conversion::DoubleToStringConverter::kMaxPrecisionDigits + 8); convert_.ToShortestSingle(value, &builder_); return *this; } FakeOFStream &operator<<(double value) { EnsureRemaining(double_conversion::DoubleToStringConverter::kMaxPrecisionDigits + 8); convert_.ToShortest(value, &builder_); return *this; } FakeOFStream &operator<<(StringPiece str) { if (str.size() > kOutBuf) { Flush(); util::WriteOrThrow(fd_, str.data(), str.size()); } else { EnsureRemaining(str.size()); builder_.AddSubstring(str.data(), str.size()); } return *this; } // Inefficient! TODO: more efficient implementation FakeOFStream &operator<<(unsigned value) { return *this << boost::lexical_cast(value); } FakeOFStream &operator<<(char c) { EnsureRemaining(1); builder_.AddCharacter(c); return *this; } // Note this does not sync. void Flush() { util::WriteOrThrow(fd_, buf_.get(), builder_.position()); builder_.Reset(); } private: void EnsureRemaining(std::size_t amount) { if (static_cast(builder_.size() - builder_.position()) < amount) { Flush(); } } util::scoped_malloc buf_; double_conversion::StringBuilder builder_; double_conversion::DoubleToStringConverter convert_; int fd_; }; } // namespace ================================================ FILE: src/kenlm/util/file.cc ================================================ #define _LARGEFILE64_SOURCE #define _FILE_OFFSET_BITS 64 #include "util/file.hh" #include "util/exception.hh" #include #include #include #include #include #include #include #include #include #include #if defined(_WIN32) || defined(_WIN64) #include #include #include #include #include #else #include #endif namespace util { scoped_fd::~scoped_fd() { if (fd_ != -1 && close(fd_)) { std::cerr << "Could not close file " << fd_ << std::endl; std::abort(); } } scoped_FILE::~scoped_FILE() { if (file_ && std::fclose(file_)) { std::cerr << "Could not close file " << std::endl; std::abort(); } } // Note that ErrnoException records errno before NameFromFD is called. FDException::FDException(int fd) throw() : fd_(fd), name_guess_(NameFromFD(fd)) { *this << "in " << name_guess_ << ' '; } FDException::~FDException() throw() {} EndOfFileException::EndOfFileException() throw() { *this << "End of file"; } EndOfFileException::~EndOfFileException() throw() {} int OpenReadOrThrow(const char *name) { int ret; #if defined(_WIN32) || defined(_WIN64) UTIL_THROW_IF(-1 == (ret = _open(name, _O_BINARY | _O_RDONLY)), ErrnoException, "while opening " << name); #else UTIL_THROW_IF(-1 == (ret = open(name, O_RDONLY)), ErrnoException, "while opening " << name); #endif return ret; } int CreateOrThrow(const char *name) { int ret; #if defined(_WIN32) || defined(_WIN64) UTIL_THROW_IF(-1 == (ret = _open(name, _O_CREAT | _O_TRUNC | _O_RDWR | _O_BINARY, _S_IREAD | _S_IWRITE)), ErrnoException, "while creating " << name); #else UTIL_THROW_IF(-1 == (ret = open(name, O_CREAT | O_TRUNC | O_RDWR, S_IRUSR | S_IWUSR | S_IRGRP | S_IROTH)), ErrnoException, "while creating " << name); #endif return ret; } uint64_t SizeFile(int fd) { #if defined(_WIN32) || defined(_WIN64) __int64 ret = _filelengthi64(fd); return (ret == -1) ? 
kBadSize : ret; #else // Not windows. #ifdef OS_ANDROID struct stat64 sb; int ret = fstat64(fd, &sb); #else struct stat sb; int ret = fstat(fd, &sb); #endif if (ret == -1 || (!sb.st_size && !S_ISREG(sb.st_mode))) return kBadSize; return sb.st_size; #endif } uint64_t SizeOrThrow(int fd) { uint64_t ret = SizeFile(fd); UTIL_THROW_IF_ARG(ret == kBadSize, FDException, (fd), "Failed to size"); return ret; } void ResizeOrThrow(int fd, uint64_t to) { #if defined(_WIN32) || defined(_WIN64) errno_t ret = _chsize_s #elif defined(OS_ANDROID) int ret = ftruncate64 #else int ret = ftruncate #endif (fd, to); UTIL_THROW_IF_ARG(ret, FDException, (fd), "while resizing to " << to << " bytes"); } std::size_t PartialRead(int fd, void *to, std::size_t amount) { #if defined(_WIN32) || defined(_WIN64) amount = min(static_cast(INT_MAX), amount); int ret = _read(fd, to, amount); #else errno = 0; ssize_t ret; do { ret = read(fd, to, amount); } while (ret == -1 && errno == EINTR); #endif UTIL_THROW_IF_ARG(ret < 0, FDException, (fd), "while reading " << amount << " bytes"); return static_cast(ret); } void ReadOrThrow(int fd, void *to_void, std::size_t amount) { uint8_t *to = static_cast(to_void); while (amount) { std::size_t ret = PartialRead(fd, to, amount); UTIL_THROW_IF(ret == 0, EndOfFileException, " in " << NameFromFD(fd) << " but there should be " << amount << " more bytes to read."); amount -= ret; to += ret; } } std::size_t ReadOrEOF(int fd, void *to_void, std::size_t amount) { uint8_t *to = static_cast(to_void); std::size_t remaining = amount; while (remaining) { std::size_t ret = PartialRead(fd, to, remaining); if (!ret) return amount - remaining; remaining -= ret; to += ret; } return amount; } void PReadOrThrow(int fd, void *to_void, std::size_t size, uint64_t off) { uint8_t *to = static_cast(to_void); #if defined(_WIN32) || defined(_WIN64) UTIL_THROW(Exception, "This pread implementation for windows is broken. Please send me a patch that does not change the file pointer. Atomically. Or send me an implementation of pwrite that is allowed to change the file pointer but can be called concurrently with pread."); const std::size_t kMaxDWORD = static_cast(4294967295UL); #endif for (;size ;) { #if defined(_WIN32) || defined(_WIN64) /* BROKEN: changes file pointer. Even if you save it and change it back, it won't be safe to use concurrently with write() or read() which lmplz does. */ // size_t might be 64-bit. DWORD is always 32. 
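// --------------------------------------------------------------------------
// Illustrative sketch, not part of KenLM: slurping a whole file with the fd
// helpers above.  ReadOrThrow keeps calling PartialRead (retrying on EINTR)
// until the requested amount arrives or EndOfFileException is thrown.
#include "util/file.hh"
#include <vector>

std::vector<char> SlurpFile(const char *name) {
  util::scoped_fd fd(util::OpenReadOrThrow(name));          // closed on return
  std::vector<char> content(util::SizeOrThrow(fd.get()));
  if (!content.empty())
    util::ReadOrThrow(fd.get(), &content[0], content.size());
  return content;
}
// --------------------------------------------------------------------------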
DWORD reading = static_cast(std::min(kMaxDWORD, size)); DWORD ret; OVERLAPPED overlapped; memset(&overlapped, 0, sizeof(OVERLAPPED)); overlapped.Offset = static_cast(off); overlapped.OffsetHigh = static_cast(off >> 32); UTIL_THROW_IF(!ReadFile((HANDLE)_get_osfhandle(fd), to, reading, &ret, &overlapped), Exception, "ReadFile failed for offset " << off); #else ssize_t ret; errno = 0; do { #ifdef OS_ANDROID ret = pread64(fd, to, size, off); #else ret = pread(fd, to, size, off); #endif } while (ret == -1 && errno == EINTR); if (ret <= 0) { UTIL_THROW_IF(ret == 0, EndOfFileException, " for reading " << size << " bytes at " << off << " from " << NameFromFD(fd)); UTIL_THROW_ARG(FDException, (fd), "while reading " << size << " bytes at offset " << off); } #endif size -= ret; off += ret; to += ret; } } void WriteOrThrow(int fd, const void *data_void, std::size_t size) { const uint8_t *data = static_cast(data_void); while (size) { #if defined(_WIN32) || defined(_WIN64) int ret = write(fd, data, min(static_cast(INT_MAX), size)); #else errno = 0; ssize_t ret; do { ret = write(fd, data, size); } while (ret == -1 && errno == EINTR); #endif UTIL_THROW_IF_ARG(ret < 1, FDException, (fd), "while writing " << size << " bytes"); data += ret; size -= ret; } } void WriteOrThrow(FILE *to, const void *data, std::size_t size) { if (!size) return; UTIL_THROW_IF(1 != std::fwrite(data, size, 1, to), ErrnoException, "Short write; requested size " << size); } void FSyncOrThrow(int fd) { // Apparently windows doesn't have fsync? #if !defined(_WIN32) && !defined(_WIN64) UTIL_THROW_IF_ARG(-1 == fsync(fd), FDException, (fd), "while syncing"); #endif } namespace { // Static assert for 64-bit off_t size. #if !defined(_WIN32) && !defined(_WIN64) && !defined(OS_ANDROID) template struct CheckOffT; template <> struct CheckOffT<8> { struct True {}; }; // If there's a compiler error on the next line, then off_t isn't 64 bit. And // that makes me a sad panda. typedef CheckOffT::True IgnoredType; #endif // Can't we all just get along? void InternalSeek(int fd, int64_t off, int whence) { if ( #if defined(_WIN32) || defined(_WIN64) (__int64)-1 == _lseeki64(fd, off, whence) #elif defined(OS_ANDROID) (off64_t)-1 == lseek64(fd, off, whence) #else (off_t)-1 == lseek(fd, off, whence) #endif ) UTIL_THROW_ARG(FDException, (fd), "while seeking to " << off << " whence " << whence); } } // namespace void SeekOrThrow(int fd, uint64_t off) { InternalSeek(fd, off, SEEK_SET); } void AdvanceOrThrow(int fd, int64_t off) { InternalSeek(fd, off, SEEK_CUR); } void SeekEnd(int fd) { InternalSeek(fd, 0, SEEK_END); } std::FILE *FDOpenOrThrow(scoped_fd &file) { std::FILE *ret = fdopen(file.get(), "r+b"); UTIL_THROW_IF_ARG(!ret, FDException, (file.get()), "Could not fdopen for write"); file.release(); return ret; } std::FILE *FDOpenReadOrThrow(scoped_fd &file) { std::FILE *ret = fdopen(file.get(), "rb"); UTIL_THROW_IF_ARG(!ret, FDException, (file.get()), "Could not fdopen for read"); file.release(); return ret; } // Sigh. Windows temporary file creation is full of race conditions. #if defined(_WIN32) || defined(_WIN64) /* mkstemp extracted from libc/sysdeps/posix/tempname.c. Copyright (C) 1991-1999, 2000, 2001, 2006 Free Software Foundation, Inc. The GNU C Library is free software; you can redistribute it and/or modify it under the terms of the GNU Lesser General Public License as published by the Free Software Foundation; either version 2.1 of the License, or (at your option) any later version. 
*/ /* This has been modified from the original version to rename the function and * set the Windows temporary flag. */ static const char letters[] = "abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789"; /* Generate a temporary file name based on TMPL. TMPL must match the rules for mk[s]temp (i.e. end in "XXXXXX"). The name constructed does not exist at the time of the call to mkstemp. TMPL is overwritten with the result. */ int mkstemp_and_unlink(char *tmpl) { int len; char *XXXXXX; static unsigned long long value; unsigned long long random_time_bits; unsigned int count; int fd = -1; int save_errno = errno; /* A lower bound on the number of temporary files to attempt to generate. The maximum total number of temporary file names that can exist for a given template is 62**6. It should never be necessary to try all these combinations. Instead if a reasonable number of names is tried (we define reasonable as 62**3) fail to give the system administrator the chance to remove the problems. */ #define ATTEMPTS_MIN (62 * 62 * 62) /* The number of times to attempt to generate a temporary file. To conform to POSIX, this must be no smaller than TMP_MAX. */ #if ATTEMPTS_MIN < TMP_MAX unsigned int attempts = TMP_MAX; #else unsigned int attempts = ATTEMPTS_MIN; #endif len = strlen (tmpl); if (len < 6 || strcmp (&tmpl[len - 6], "XXXXXX")) { errno = EINVAL; return -1; } /* This is where the Xs start. */ XXXXXX = &tmpl[len - 6]; /* Get some more or less random data. */ { SYSTEMTIME stNow; FILETIME ftNow; // get system time GetSystemTime(&stNow); stNow.wMilliseconds = 500; if (!SystemTimeToFileTime(&stNow, &ftNow)) { errno = -1; return -1; } random_time_bits = (((unsigned long long)ftNow.dwHighDateTime << 32) | (unsigned long long)ftNow.dwLowDateTime); } value += random_time_bits ^ (unsigned long long)GetCurrentThreadId (); for (count = 0; count < attempts; value += 7777, ++count) { unsigned long long v = value; /* Fill in the random bits. */ XXXXXX[0] = letters[v % 62]; v /= 62; XXXXXX[1] = letters[v % 62]; v /= 62; XXXXXX[2] = letters[v % 62]; v /= 62; XXXXXX[3] = letters[v % 62]; v /= 62; XXXXXX[4] = letters[v % 62]; v /= 62; XXXXXX[5] = letters[v % 62]; /* Modified for windows and to unlink */ // fd = open (tmpl, O_RDWR | O_CREAT | O_EXCL, _S_IREAD | _S_IWRITE); int flags = _O_RDWR | _O_CREAT | _O_EXCL | _O_BINARY; flags |= _O_TEMPORARY; fd = _open (tmpl, flags, _S_IREAD | _S_IWRITE); if (fd >= 0) { errno = save_errno; return fd; } else if (errno != EEXIST) return -1; } /* We got out of the loop because we ran out of combinations to try. */ errno = EEXIST; return -1; } #else int mkstemp_and_unlink(char *tmpl) { int ret = mkstemp(tmpl); if (ret != -1) { UTIL_THROW_IF(unlink(tmpl), ErrnoException, "while deleting delete " << tmpl); } return ret; } #endif // If it's a directory, add a /. This lets users say -T /tmp without creating // /tmpAAAAAA void NormalizeTempPrefix(std::string &base) { if (base.empty()) return; if (base[base.size() - 1] == '/') return; struct stat sb; // It's fine for it to not exist. 
if (-1 == stat(base.c_str(), &sb)) return; if ( #if defined(_WIN32) || defined(_WIN64) sb.st_mode & _S_IFDIR #else S_ISDIR(sb.st_mode) #endif ) base += '/'; } int MakeTemp(const std::string &base) { std::string name(base); name += "XXXXXX"; name.push_back(0); int ret; UTIL_THROW_IF(-1 == (ret = mkstemp_and_unlink(&name[0])), ErrnoException, "while making a temporary based on " << base); return ret; } std::FILE *FMakeTemp(const std::string &base) { util::scoped_fd file(MakeTemp(base)); return FDOpenOrThrow(file); } int DupOrThrow(int fd) { int ret = dup(fd); UTIL_THROW_IF_ARG(ret == -1, FDException, (fd), "in duplicating the file descriptor"); return ret; } namespace { // Try to name things but be willing to fail too. bool TryName(int fd, std::string &out) { #if defined(_WIN32) || defined(_WIN64) return false; #else std::string name("/proc/self/fd/"); std::ostringstream convert; convert << fd; name += convert.str(); struct stat sb; if (-1 == lstat(name.c_str(), &sb)) return false; out.resize(sb.st_size + 1); ssize_t ret = readlink(name.c_str(), &out[0], sb.st_size + 1); if (-1 == ret) return false; if (ret > sb.st_size) { // Increased in size?! return false; } out.resize(ret); // Don't use the non-file names. if (!out.empty() && out[0] != '/') return false; return true; #endif } } // namespace std::string NameFromFD(int fd) { std::string ret; if (TryName(fd, ret)) return ret; switch (fd) { case 0: return "stdin"; case 1: return "stdout"; case 2: return "stderr"; } ret = "fd "; std::ostringstream convert; convert << fd; ret += convert.str(); return ret; } } // namespace util ================================================ FILE: src/kenlm/util/file.hh ================================================ #ifndef UTIL_FILE__ #define UTIL_FILE__ #include "util/exception.hh" #include #include #include #include namespace util { class scoped_fd { public: scoped_fd() : fd_(-1) {} explicit scoped_fd(int fd) : fd_(fd) {} ~scoped_fd(); void reset(int to = -1) { scoped_fd other(fd_); fd_ = to; } int get() const { return fd_; } int operator*() const { return fd_; } int release() { int ret = fd_; fd_ = -1; return ret; } private: int fd_; scoped_fd(const scoped_fd &); scoped_fd &operator=(const scoped_fd &); }; class scoped_FILE { public: explicit scoped_FILE(std::FILE *file = NULL) : file_(file) {} ~scoped_FILE(); std::FILE *get() { return file_; } const std::FILE *get() const { return file_; } void reset(std::FILE *to = NULL) { scoped_FILE other(file_); file_ = to; } std::FILE *release() { std::FILE *ret = file_; file_ = NULL; return ret; } private: std::FILE *file_; }; /* Thrown for any operation where the fd is known. */ class FDException : public ErrnoException { public: explicit FDException(int fd) throw(); virtual ~FDException() throw(); // This may no longer be valid if the exception was thrown past open. int FD() const { return fd_; } // Guess from NameFromFD. const std::string &NameGuess() const { return name_guess_; } private: int fd_; std::string name_guess_; }; // End of file reached. class EndOfFileException : public Exception { public: EndOfFileException() throw(); ~EndOfFileException() throw(); }; // Open for read only. int OpenReadOrThrow(const char *name); // Create file if it doesn't exist, truncate if it does. Opened for write. int CreateOrThrow(const char *name); // Return value for SizeFile when it can't size properly. 
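// --------------------------------------------------------------------------
// Illustrative sketch, not part of KenLM: an anonymous temporary file built
// from the helpers above.  mkstemp_and_unlink has already unlinked the name,
// so the file vanishes when the descriptor closes.  The prefix is hypothetical.
#include "util/file.hh"
#include <string>

void ScratchSpaceExample() {
  std::string prefix("/tmp");
  util::NormalizeTempPrefix(prefix);              // appends '/' for directories
  util::scoped_fd scratch(util::MakeTemp(prefix));
  const char data[] = "spill data";
  util::WriteOrThrow(scratch.get(), data, sizeof(data) - 1);
  // scratch closes (and the unlinked file disappears) when it goes out of scope.
}
// --------------------------------------------------------------------------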
const uint64_t kBadSize = (uint64_t)-1; uint64_t SizeFile(int fd); uint64_t SizeOrThrow(int fd); void ResizeOrThrow(int fd, uint64_t to); std::size_t PartialRead(int fd, void *to, std::size_t size); void ReadOrThrow(int fd, void *to, std::size_t size); std::size_t ReadOrEOF(int fd, void *to_void, std::size_t size); // Positioned: unix only for now. void PReadOrThrow(int fd, void *to, std::size_t size, uint64_t off); void WriteOrThrow(int fd, const void *data_void, std::size_t size); void WriteOrThrow(FILE *to, const void *data, std::size_t size); void FSyncOrThrow(int fd); // Seeking void SeekOrThrow(int fd, uint64_t off); void AdvanceOrThrow(int fd, int64_t off); void SeekEnd(int fd); std::FILE *FDOpenOrThrow(scoped_fd &file); std::FILE *FDOpenReadOrThrow(scoped_fd &file); // Temporary files // Append a / if base is a directory. void NormalizeTempPrefix(std::string &base); int MakeTemp(const std::string &prefix); std::FILE *FMakeTemp(const std::string &prefix); // dup an fd. int DupOrThrow(int fd); /* Attempt get file name from fd. This won't always work (i.e. on Windows or * a pipe). The file might have been renamed. It's intended for diagnostics * and logging only. */ std::string NameFromFD(int fd); } // namespace util #endif // UTIL_FILE__ ================================================ FILE: src/kenlm/util/file_piece.cc ================================================ #include "util/file_piece.hh" #include "util/double-conversion/double-conversion.h" #include "util/exception.hh" #include "util/file.hh" #include "util/mmap.hh" #if defined(_WIN32) || defined(_WIN64) #include #else #include #endif #include #include #include #include #include #include #include #include namespace util { ParseNumberException::ParseNumberException(StringPiece value) throw() { *this << "Could not parse \"" << value << "\" into a number"; } // Sigh this is the only way I could come up with to do a _const_ bool. It has ' ', '\f', '\n', '\r', '\t', and '\v' (same as isspace on C locale). const bool kSpaces[256] = {0,0,0,0,0,0,0,0,0,1,1,1,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0}; FilePiece::FilePiece(const char *name, std::ostream *show_progress, std::size_t min_buffer) : file_(OpenReadOrThrow(name)), total_size_(SizeFile(file_.get())), page_(SizePage()), progress_(total_size_, total_size_ == kBadSize ? NULL : show_progress, std::string("Reading ") + name) { Initialize(name, show_progress, min_buffer); } namespace { std::string NamePossiblyFind(int fd, const char *name) { if (name) return name; return NameFromFD(fd); } } // namespace FilePiece::FilePiece(int fd, const char *name, std::ostream *show_progress, std::size_t min_buffer) : file_(fd), total_size_(SizeFile(file_.get())), page_(SizePage()), progress_(total_size_, total_size_ == kBadSize ? 
NULL : show_progress, std::string("Reading ") + NamePossiblyFind(fd, name)) { Initialize(NamePossiblyFind(fd, name).c_str(), show_progress, min_buffer); } FilePiece::FilePiece(std::istream &stream, const char *name, std::size_t min_buffer) : total_size_(kBadSize), page_(SizePage()) { InitializeNoRead("istream", min_buffer); fallback_to_read_ = true; data_.reset(MallocOrThrow(default_map_size_), default_map_size_, scoped_memory::MALLOC_ALLOCATED); position_ = data_.begin(); position_end_ = position_; fell_back_.Reset(stream); } FilePiece::~FilePiece() {} StringPiece FilePiece::ReadLine(char delim) { std::size_t skip = 0; while (true) { for (const char *i = position_ + skip; i < position_end_; ++i) { if (*i == delim) { StringPiece ret(position_, i - position_); position_ = i + 1; return ret; } } if (at_end_) { if (position_ == position_end_) Shift(); return Consume(position_end_); } skip = position_end_ - position_; Shift(); } } float FilePiece::ReadFloat() { return ReadNumber(); } double FilePiece::ReadDouble() { return ReadNumber(); } long int FilePiece::ReadLong() { return ReadNumber(); } unsigned long int FilePiece::ReadULong() { return ReadNumber(); } // Factored out so that istream can call this. void FilePiece::InitializeNoRead(const char *name, std::size_t min_buffer) { file_name_ = name; default_map_size_ = page_ * std::max((min_buffer / page_ + 1), 2); position_ = NULL; position_end_ = NULL; mapped_offset_ = 0; at_end_ = false; } void FilePiece::Initialize(const char *name, std::ostream *show_progress, std::size_t min_buffer) { InitializeNoRead(name, min_buffer); if (total_size_ == kBadSize) { // So the assertion passes. fallback_to_read_ = false; if (show_progress) *show_progress << "File " << name << " isn't normal. Using slower read() instead of mmap(). No progress bar." << std::endl; TransitionToRead(); } else { fallback_to_read_ = false; } Shift(); // gzip detect. if ((position_end_ >= position_ + ReadCompressed::kMagicSize) && ReadCompressed::DetectCompressedMagic(position_)) { if (!fallback_to_read_) { at_end_ = false; TransitionToRead(); } } } namespace { static const double_conversion::StringToDoubleConverter kConverter( double_conversion::StringToDoubleConverter::ALLOW_TRAILING_JUNK | double_conversion::StringToDoubleConverter::ALLOW_LEADING_SPACES, std::numeric_limits::quiet_NaN(), std::numeric_limits::quiet_NaN(), "inf", "NaN"); void ParseNumber(const char *begin, const char *&end, float &out) { int count; out = kConverter.StringToFloat(begin, end - begin, &count); end = begin + count; } void ParseNumber(const char *begin, const char *&end, double &out) { int count; out = kConverter.StringToDouble(begin, end - begin, &count); end = begin + count; } void ParseNumber(const char *begin, const char *&end, long int &out) { char *silly_end; out = strtol(begin, &silly_end, 10); end = silly_end; } void ParseNumber(const char *begin, const char *&end, unsigned long int &out) { char *silly_end; out = strtoul(begin, &silly_end, 10); end = silly_end; } } // namespace template T FilePiece::ReadNumber() { SkipSpaces(); while (last_space_ < position_) { if (at_end_) { // Hallucinate a null off the end of the file. 
std::string buffer(position_, position_end_); const char *buf = buffer.c_str(); const char *end = buf + buffer.size(); T ret; ParseNumber(buf, end, ret); if (buf == end) throw ParseNumberException(buffer); position_ += end - buf; return ret; } Shift(); } const char *end = last_space_; T ret; ParseNumber(position_, end, ret); if (end == position_) throw ParseNumberException(ReadDelimited()); position_ = end; return ret; } const char *FilePiece::FindDelimiterOrEOF(const bool *delim) { std::size_t skip = 0; while (true) { for (const char *i = position_ + skip; i < position_end_; ++i) { if (delim[static_cast(*i)]) return i; } if (at_end_) { if (position_ == position_end_) Shift(); return position_end_; } skip = position_end_ - position_; Shift(); } } void FilePiece::Shift() { if (at_end_) { progress_.Finished(); throw EndOfFileException(); } uint64_t desired_begin = position_ - data_.begin() + mapped_offset_; if (!fallback_to_read_) MMapShift(desired_begin); // Notice an mmap failure might set the fallback. if (fallback_to_read_) ReadShift(); for (last_space_ = position_end_ - 1; last_space_ >= position_; --last_space_) { if (kSpaces[static_cast(*last_space_)]) break; } } void FilePiece::MMapShift(uint64_t desired_begin) { // Use mmap. uint64_t ignore = desired_begin % page_; // Duplicate request for Shift means give more data. if (position_ == data_.begin() + ignore && position_) { default_map_size_ *= 2; } // Local version so that in case of failure it doesn't overwrite the class variable. uint64_t mapped_offset = desired_begin - ignore; uint64_t mapped_size; if (default_map_size_ >= static_cast(total_size_ - mapped_offset)) { at_end_ = true; mapped_size = total_size_ - mapped_offset; } else { mapped_size = default_map_size_; } // Forcibly clear the existing mmap first. data_.reset(); try { MapRead(POPULATE_OR_LAZY, *file_, mapped_offset, mapped_size, data_); } catch (const util::ErrnoException &e) { if (desired_begin) { SeekOrThrow(*file_, desired_begin); } // The mmap was scheduled to end the file, but now we're going to read it. at_end_ = false; TransitionToRead(); return; } mapped_offset_ = mapped_offset; position_ = data_.begin() + ignore; position_end_ = data_.begin() + mapped_size; progress_.Set(desired_begin); } void FilePiece::TransitionToRead() { assert(!fallback_to_read_); fallback_to_read_ = true; data_.reset(); data_.reset(MallocOrThrow(default_map_size_), default_map_size_, scoped_memory::MALLOC_ALLOCATED); position_ = data_.begin(); position_end_ = position_; try { fell_back_.Reset(file_.release()); } catch (util::Exception &e) { e << " in file " << file_name_; throw; } } void FilePiece::ReadShift() { assert(fallback_to_read_); // Bytes [data_.begin(), position_) have been consumed. // Bytes [position_, position_end_) have been read into the buffer. // Start at the beginning of the buffer if there's nothing useful in it. if (position_ == position_end_) { mapped_offset_ += (position_end_ - data_.begin()); position_ = data_.begin(); position_end_ = position_; } std::size_t already_read = position_end_ - data_.begin(); if (already_read == default_map_size_) { if (position_ == data_.begin()) { // Buffer too small. 
std::size_t valid_length = position_end_ - position_; default_map_size_ *= 2; data_.call_realloc(default_map_size_); UTIL_THROW_IF(!data_.get(), ErrnoException, "realloc failed for " << default_map_size_); position_ = data_.begin(); position_end_ = position_ + valid_length; } else { std::size_t moving = position_end_ - position_; memmove(data_.get(), position_, moving); position_ = data_.begin(); position_end_ = position_ + moving; already_read = moving; } } std::size_t read_return = fell_back_.Read(static_cast(data_.get()) + already_read, default_map_size_ - already_read); progress_.Set(fell_back_.RawAmount()); if (read_return == 0) { at_end_ = true; } position_end_ += read_return; } } // namespace util ================================================ FILE: src/kenlm/util/file_piece.hh ================================================ #ifndef UTIL_FILE_PIECE__ #define UTIL_FILE_PIECE__ #include "util/ersatz_progress.hh" #include "util/exception.hh" #include "util/file.hh" #include "util/mmap.hh" #include "util/read_compressed.hh" #include "util/string_piece.hh" #include #include #include #include namespace util { class ParseNumberException : public Exception { public: explicit ParseNumberException(StringPiece value) throw(); ~ParseNumberException() throw() {} }; extern const bool kSpaces[256]; // Memory backing the returned StringPiece may vanish on the next call. class FilePiece { public: // 1 MB default. explicit FilePiece(const char *file, std::ostream *show_progress = NULL, std::size_t min_buffer = 1048576); // Takes ownership of fd. name is used for messages. explicit FilePiece(int fd, const char *name = NULL, std::ostream *show_progress = NULL, std::size_t min_buffer = 1048576); /* Read from an istream. Don't use this if you can avoid it. Raw fd IO is * much faster. But sometimes you just have an istream like Boost's HTTP * server and want to parse it the same way. * name is just used for messages and FileName(). */ explicit FilePiece(std::istream &stream, const char *name = NULL, std::size_t min_buffer = 1048576); ~FilePiece(); char get() { if (position_ == position_end_) { Shift(); if (at_end_) throw EndOfFileException(); } return *(position_++); } // Leaves the delimiter, if any, to be returned by get(). Delimiters defined by isspace(). StringPiece ReadDelimited(const bool *delim = kSpaces) { SkipSpaces(delim); return Consume(FindDelimiterOrEOF(delim)); } // Unlike ReadDelimited, this includes leading spaces and consumes the delimiter. // It is similar to getline in that way. StringPiece ReadLine(char delim = '\n'); float ReadFloat(); double ReadDouble(); long int ReadLong(); unsigned long int ReadULong(); // Skip spaces defined by isspace. void SkipSpaces(const bool *delim = kSpaces) { for (; ; ++position_) { if (position_ == position_end_) Shift(); if (!delim[static_cast(*position_)]) return; } } uint64_t Offset() const { return position_ - data_.begin() + mapped_offset_; } const std::string &FileName() const { return file_name_; } private: void InitializeNoRead(const char *name, std::size_t min_buffer); // Calls InitializeNoRead, so don't call both. void Initialize(const char *name, std::ostream *show_progress, std::size_t min_buffer); template T ReadNumber(); StringPiece Consume(const char *to) { StringPiece ret(position_, to - position_); position_ = to; return ret; } const char *FindDelimiterOrEOF(const bool *delim = kSpaces); void Shift(); // Backends to Shift(). 
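// --------------------------------------------------------------------------
// Illustrative sketch, not part of KenLM: scanning a whitespace-delimited
// file of "word count" records with the FilePiece class declared above.  The
// file name and record layout are hypothetical; EndOfFileException marks the
// end of input, and each StringPiece is invalidated by the next read.
#include "util/file_piece.hh"
#include <iostream>

void CountTokens(const char *name) {
  util::FilePiece in(name, &std::cerr);           // progress bar on stderr
  double total = 0.0;
  try {
    while (true) {
      StringPiece word = in.ReadDelimited();      // valid only until next call
      double count = in.ReadDouble();
      (void)word;
      total += count;
    }
  } catch (const util::EndOfFileException &) {}
  std::cout << "total " << total << '\n';
}
// --------------------------------------------------------------------------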
void MMapShift(uint64_t desired_begin); void TransitionToRead(); void ReadShift(); const char *position_, *last_space_, *position_end_; scoped_fd file_; const uint64_t total_size_; const uint64_t page_; std::size_t default_map_size_; uint64_t mapped_offset_; // Order matters: file_ should always be destroyed after this. scoped_memory data_; bool at_end_; bool fallback_to_read_; ErsatzProgress progress_; std::string file_name_; ReadCompressed fell_back_; }; } // namespace util #endif // UTIL_FILE_PIECE__ ================================================ FILE: src/kenlm/util/file_piece_test.cc ================================================ // Tests might fail if you have creative characters in your path. Sue me. #include "util/file_piece.hh" #include "util/file.hh" #include "util/scoped.hh" #define BOOST_TEST_MODULE FilePieceTest #include #include #include #include #include #include namespace util { namespace { std::string FileLocation() { if (boost::unit_test::framework::master_test_suite().argc < 2) { return "file_piece.cc"; } std::string ret(boost::unit_test::framework::master_test_suite().argv[1]); return ret; } /* istream */ BOOST_AUTO_TEST_CASE(IStream) { std::fstream ref(FileLocation().c_str(), std::ios::in); std::fstream backing(FileLocation().c_str(), std::ios::in); FilePiece test(backing); std::string ref_line; while (getline(ref, ref_line)) { StringPiece test_line(test.ReadLine()); BOOST_CHECK_EQUAL(ref_line, test_line); } BOOST_CHECK_THROW(test.get(), EndOfFileException); BOOST_CHECK_THROW(test.get(), EndOfFileException); } /* mmap implementation */ BOOST_AUTO_TEST_CASE(MMapReadLine) { std::fstream ref(FileLocation().c_str(), std::ios::in); FilePiece test(FileLocation().c_str(), NULL, 1); std::string ref_line; while (getline(ref, ref_line)) { StringPiece test_line(test.ReadLine()); // I submitted a bug report to ICU: http://bugs.icu-project.org/trac/ticket/7924 if (!test_line.empty() || !ref_line.empty()) { BOOST_CHECK_EQUAL(ref_line, test_line); } } BOOST_CHECK_THROW(test.get(), EndOfFileException); } #if !defined(_WIN32) && !defined(_WIN64) && !defined(__APPLE__) /* Apple isn't happy with the popen, fileno, dup. And I don't want to * reimplement popen. This is an issue with the test. 
*/ /* read() implementation */ BOOST_AUTO_TEST_CASE(StreamReadLine) { std::fstream ref(FileLocation().c_str(), std::ios::in); std::string popen_args = "cat \""; popen_args += FileLocation(); popen_args += '"'; FILE *catter = popen(popen_args.c_str(), "r"); BOOST_REQUIRE(catter); FilePiece test(dup(fileno(catter)), "file_piece.cc", NULL, 1); std::string ref_line; while (getline(ref, ref_line)) { StringPiece test_line(test.ReadLine()); // I submitted a bug report to ICU: http://bugs.icu-project.org/trac/ticket/7924 if (!test_line.empty() || !ref_line.empty()) { BOOST_CHECK_EQUAL(ref_line, test_line); } } BOOST_CHECK_THROW(test.get(), EndOfFileException); BOOST_REQUIRE(!pclose(catter)); } #endif #ifdef HAVE_ZLIB // gzip file BOOST_AUTO_TEST_CASE(PlainZipReadLine) { std::string location(FileLocation()); std::fstream ref(location.c_str(), std::ios::in); std::string command("gzip <\""); command += location + "\" >\"" + location + "\".gz"; BOOST_REQUIRE_EQUAL(0, system(command.c_str())); FilePiece test((location + ".gz").c_str(), NULL, 1); unlink((location + ".gz").c_str()); std::string ref_line; while (getline(ref, ref_line)) { StringPiece test_line(test.ReadLine()); // I submitted a bug report to ICU: http://bugs.icu-project.org/trac/ticket/7924 if (!test_line.empty() || !ref_line.empty()) { BOOST_CHECK_EQUAL(ref_line, test_line); } } BOOST_CHECK_THROW(test.get(), EndOfFileException); } // gzip stream. Apple doesn't like popen, fileno, dup. This is an issue with // the test. #ifndef __APPLE__ BOOST_AUTO_TEST_CASE(StreamZipReadLine) { std::fstream ref(FileLocation().c_str(), std::ios::in); std::string command("gzip <\""); command += FileLocation() + "\""; FILE * catter = popen(command.c_str(), "r"); BOOST_REQUIRE(catter); FilePiece test(dup(fileno(catter)), "file_piece.cc.gz", NULL, 1); std::string ref_line; while (getline(ref, ref_line)) { StringPiece test_line(test.ReadLine()); // I submitted a bug report to ICU: http://bugs.icu-project.org/trac/ticket/7924 if (!test_line.empty() || !ref_line.empty()) { BOOST_CHECK_EQUAL(ref_line, test_line); } } BOOST_CHECK_THROW(test.get(), EndOfFileException); BOOST_REQUIRE(!pclose(catter)); } #endif // __APPLE__ #endif // HAVE_ZLIB } // namespace } // namespace util ================================================ FILE: src/kenlm/util/getopt.c ================================================ /* POSIX getopt for Windows AT&T Public License Code given out at the 1985 UNIFORUM conference in Dallas. 
*/

#ifndef __GNUC__

#include "getopt.hh"
#include <stdio.h>
#include <string.h>

#define NULL	0
#define EOF	(-1)
#define ERR(s, c)	if(opterr){\
	char errbuf[2];\
	errbuf[0] = c; errbuf[1] = '\n';\
	fputs(argv[0], stderr);\
	fputs(s, stderr);\
	fputc(c, stderr);}
	//(void) write(2, argv[0], (unsigned)strlen(argv[0]));\
	//(void) write(2, s, (unsigned)strlen(s));\
	//(void) write(2, errbuf, 2);}

int	opterr = 1;
int	optind = 1;
int	optopt;
char	*optarg;

int
getopt(argc, argv, opts)
int	argc;
char	**argv, *opts;
{
	static int sp = 1;
	register int c;
	register char *cp;

	if(sp == 1)
		if(optind >= argc ||
		   argv[optind][0] != '-' || argv[optind][1] == '\0')
			return(EOF);
		else if(strcmp(argv[optind], "--") == NULL) {
			optind++;
			return(EOF);
		}
	optopt = c = argv[optind][sp];
	if(c == ':' || (cp=strchr(opts, c)) == NULL) {
		ERR(": illegal option -- ", c);
		if(argv[optind][++sp] == '\0') {
			optind++;
			sp = 1;
		}
		return('?');
	}
	if(*++cp == ':') {
		if(argv[optind][sp+1] != '\0')
			optarg = &argv[optind++][sp+1];
		else if(++optind >= argc) {
			ERR(": option requires an argument -- ", c);
			sp = 1;
			return('?');
		} else
			optarg = argv[optind++];
		sp = 1;
	} else {
		if(argv[optind][++sp] == '\0') {
			sp = 1;
			optind++;
		}
		optarg = NULL;
	}
	return(c);
}

#endif  /* __GNUC__ */

================================================
FILE: src/kenlm/util/getopt.hh
================================================
/*
POSIX getopt for Windows

AT&T Public License

Code given out at the 1985 UNIFORUM conference in Dallas.
*/

#ifdef __GNUC__
#include <getopt.h>
#endif
#ifndef __GNUC__

#ifndef _WINGETOPT_H_
#define _WINGETOPT_H_

#ifdef __cplusplus
extern "C" {
#endif

extern int opterr;
extern int optind;
extern int optopt;
extern char *optarg;
extern int getopt(int argc, char **argv, char *opts);

#ifdef __cplusplus
}
#endif

#endif  /* _GETOPT_H_ */
#endif  /* __GNUC__ */

================================================
FILE: src/kenlm/util/have.hh
================================================
/* Optional packages. You might want to integrate this with your build system
 * e.g. config.h from ./configure.
 */
#ifndef UTIL_HAVE__
#define UTIL_HAVE__

#ifdef HAVE_CONFIG_H
#include "config.h"
#endif

#ifndef HAVE_ICU
//#define HAVE_ICU
#endif

#endif // UTIL_HAVE__

================================================
FILE: src/kenlm/util/joint_sort.hh
================================================
#ifndef UTIL_JOINT_SORT__
#define UTIL_JOINT_SORT__

/* A terrifying amount of C++ to coax std::sort into sorting one range while
 * also permuting another range the same way.
 */
*/ #include "util/proxy_iterator.hh" #include #include #include namespace util { namespace detail { template class JointProxy; template class JointIter { public: JointIter() {} JointIter(const KeyIter &key_iter, const ValueIter &value_iter) : key_(key_iter), value_(value_iter) {} bool operator==(const JointIter &other) const { return key_ == other.key_; } bool operator<(const JointIter &other) const { return (key_ < other.key_); } std::ptrdiff_t operator-(const JointIter &other) const { return key_ - other.key_; } JointIter &operator+=(std::ptrdiff_t amount) { key_ += amount; value_ += amount; return *this; } void swap(const JointIter &other) { std::swap(key_, other.key_); std::swap(value_, other.value_); } private: friend class JointProxy; KeyIter key_; ValueIter value_; }; template class JointProxy { private: typedef JointIter InnerIterator; public: typedef struct { typename std::iterator_traits::value_type key; typename std::iterator_traits::value_type value; const typename std::iterator_traits::value_type &GetKey() const { return key; } } value_type; JointProxy(const KeyIter &key_iter, const ValueIter &value_iter) : inner_(key_iter, value_iter) {} JointProxy(const JointProxy &other) : inner_(other.inner_) {} operator value_type() const { value_type ret; ret.key = *inner_.key_; ret.value = *inner_.value_; return ret; } JointProxy &operator=(const JointProxy &other) { *inner_.key_ = *other.inner_.key_; *inner_.value_ = *other.inner_.value_; return *this; } JointProxy &operator=(const value_type &other) { *inner_.key_ = other.key; *inner_.value_ = other.value; return *this; } typename std::iterator_traits::reference GetKey() const { return *(inner_.key_); } void swap(JointProxy &other) { std::swap(*inner_.key_, *other.inner_.key_); std::swap(*inner_.value_, *other.inner_.value_); } private: friend class ProxyIterator >; InnerIterator &Inner() { return inner_; } const InnerIterator &Inner() const { return inner_; } InnerIterator inner_; }; template class LessWrapper : public std::binary_function { public: explicit LessWrapper(const Less &less) : less_(less) {} bool operator()(const Proxy &left, const Proxy &right) const { return less_(left.GetKey(), right.GetKey()); } bool operator()(const Proxy &left, const typename Proxy::value_type &right) const { return less_(left.GetKey(), right.GetKey()); } bool operator()(const typename Proxy::value_type &left, const Proxy &right) const { return less_(left.GetKey(), right.GetKey()); } bool operator()(const typename Proxy::value_type &left, const typename Proxy::value_type &right) const { return less_(left.GetKey(), right.GetKey()); } private: const Less less_; }; } // namespace detail template class PairedIterator : public ProxyIterator > { public: PairedIterator(const KeyIter &key, const ValueIter &value) : ProxyIterator >(detail::JointProxy(key, value)) {} }; template void JointSort(const KeyIter &key_begin, const KeyIter &key_end, const ValueIter &value_begin, const Less &less) { ProxyIterator > full_begin(detail::JointProxy(key_begin, value_begin)); detail::LessWrapper, Less> less_wrap(less); std::sort(full_begin, full_begin + (key_end - key_begin), less_wrap); } template void JointSort(const KeyIter &key_begin, const KeyIter &key_end, const ValueIter &value_begin) { JointSort(key_begin, key_end, value_begin, std::less::value_type>()); } } // namespace util namespace std { template void swap(util::detail::JointIter &left, util::detail::JointIter &right) { left.swap(right); } template void swap(util::detail::JointProxy &left, 
util::detail::JointProxy &right) { left.swap(right); } } // namespace std #endif // UTIL_JOINT_SORT__ ================================================ FILE: src/kenlm/util/joint_sort_test.cc ================================================ #include "util/joint_sort.hh" #define BOOST_TEST_MODULE JointSortTest #include namespace util { namespace { BOOST_AUTO_TEST_CASE(just_flip) { char keys[2]; int values[2]; keys[0] = 1; values[0] = 327; keys[1] = 0; values[1] = 87897; JointSort(keys + 0, keys + 2, values + 0); BOOST_CHECK_EQUAL(0, keys[0]); BOOST_CHECK_EQUAL(87897, values[0]); BOOST_CHECK_EQUAL(1, keys[1]); BOOST_CHECK_EQUAL(327, values[1]); } BOOST_AUTO_TEST_CASE(three) { char keys[3]; int values[3]; keys[0] = 1; values[0] = 327; keys[1] = 2; values[1] = 87897; keys[2] = 0; values[2] = 10; JointSort(keys + 0, keys + 3, values + 0); BOOST_CHECK_EQUAL(0, keys[0]); BOOST_CHECK_EQUAL(1, keys[1]); BOOST_CHECK_EQUAL(2, keys[2]); } BOOST_AUTO_TEST_CASE(char_int) { char keys[4]; int values[4]; keys[0] = 3; values[0] = 327; keys[1] = 1; values[1] = 87897; keys[2] = 2; values[2] = 10; keys[3] = 0; values[3] = 24347; JointSort(keys + 0, keys + 4, values + 0); BOOST_CHECK_EQUAL(0, keys[0]); BOOST_CHECK_EQUAL(24347, values[0]); BOOST_CHECK_EQUAL(1, keys[1]); BOOST_CHECK_EQUAL(87897, values[1]); BOOST_CHECK_EQUAL(2, keys[2]); BOOST_CHECK_EQUAL(10, values[2]); BOOST_CHECK_EQUAL(3, keys[3]); BOOST_CHECK_EQUAL(327, values[3]); } }} // namespace anonymous util ================================================ FILE: src/kenlm/util/mmap.cc ================================================ /* Memory mapping wrappers. * ARM and MinGW ports contributed by Hideo Okuma and Tomoyuki Yoshimura at * NICT. */ #include "util/mmap.hh" #include "util/exception.hh" #include "util/file.hh" #include "util/scoped.hh" #include #include #include #include #include #include #if defined(_WIN32) || defined(_WIN64) #include #include #else #include #include #endif namespace util { long SizePage() { #if defined(_WIN32) || defined(_WIN64) SYSTEM_INFO si; GetSystemInfo(&si); return si.dwAllocationGranularity; #else return sysconf(_SC_PAGE_SIZE); #endif } void SyncOrThrow(void *start, size_t length) { #if defined(_WIN32) || defined(_WIN64) UTIL_THROW_IF(!::FlushViewOfFile(start, length), ErrnoException, "Failed to sync mmap"); #else UTIL_THROW_IF(msync(start, length, MS_SYNC), ErrnoException, "Failed to sync mmap"); #endif } void UnmapOrThrow(void *start, size_t length) { #if defined(_WIN32) || defined(_WIN64) UTIL_THROW_IF(!::UnmapViewOfFile(start), ErrnoException, "Failed to unmap a file"); #else UTIL_THROW_IF(munmap(start, length), ErrnoException, "munmap failed"); #endif } scoped_mmap::~scoped_mmap() { if (data_ != (void*)-1) { try { // Thanks Denis Filimonov for pointing out NFS likes msync first. 
SyncOrThrow(data_, size_); UnmapOrThrow(data_, size_); } catch (const util::ErrnoException &e) { std::cerr << e.what(); abort(); } } } void scoped_memory::reset(void *data, std::size_t size, Alloc source) { switch(source_) { case MMAP_ALLOCATED: scoped_mmap(data_, size_); break; case ARRAY_ALLOCATED: delete [] reinterpret_cast(data_); break; case MALLOC_ALLOCATED: free(data_); break; case NONE_ALLOCATED: break; } data_ = data; size_ = size; source_ = source; } void scoped_memory::call_realloc(std::size_t size) { assert(source_ == MALLOC_ALLOCATED || source_ == NONE_ALLOCATED); void *new_data = realloc(data_, size); if (!new_data) { reset(); } else { reset(new_data, size, MALLOC_ALLOCATED); } } void *MapOrThrow(std::size_t size, bool for_write, int flags, bool prefault, int fd, uint64_t offset) { #ifdef MAP_POPULATE // Linux specific if (prefault) { flags |= MAP_POPULATE; } #endif #if defined(_WIN32) || defined(_WIN64) int protectC = for_write ? PAGE_READWRITE : PAGE_READONLY; int protectM = for_write ? FILE_MAP_WRITE : FILE_MAP_READ; uint64_t total_size = size + offset; HANDLE hMapping = CreateFileMapping((HANDLE)_get_osfhandle(fd), NULL, protectC, total_size >> 32, static_cast(total_size), NULL); UTIL_THROW_IF(!hMapping, ErrnoException, "CreateFileMapping failed"); LPVOID ret = MapViewOfFile(hMapping, protectM, offset >> 32, offset, size); CloseHandle(hMapping); UTIL_THROW_IF(!ret, ErrnoException, "MapViewOfFile failed"); #else int protect = for_write ? (PROT_READ | PROT_WRITE) : PROT_READ; void *ret; UTIL_THROW_IF((ret = mmap(NULL, size, protect, flags, fd, offset)) == MAP_FAILED, ErrnoException, "mmap failed for size " << size << " at offset " << offset); # ifdef MADV_HUGEPAGE /* We like huge pages but it's fine if we can't have them. Note that huge * pages are not supported for file-backed mmap on linux. */ madvise(ret, size, MADV_HUGEPAGE); # endif #endif return ret; } const int kFileFlags = #if defined(_WIN32) || defined(_WIN64) 0 // MapOrThrow ignores flags on windows #elif defined(MAP_FILE) MAP_FILE | MAP_SHARED #else MAP_SHARED #endif ; void MapRead(LoadMethod method, int fd, uint64_t offset, std::size_t size, scoped_memory &out) { switch (method) { case LAZY: out.reset(MapOrThrow(size, false, kFileFlags, false, fd, offset), size, scoped_memory::MMAP_ALLOCATED); break; case POPULATE_OR_LAZY: #ifdef MAP_POPULATE case POPULATE_OR_READ: #endif out.reset(MapOrThrow(size, false, kFileFlags, true, fd, offset), size, scoped_memory::MMAP_ALLOCATED); break; #ifndef MAP_POPULATE case POPULATE_OR_READ: #endif case READ: out.reset(MallocOrThrow(size), size, scoped_memory::MALLOC_ALLOCATED); SeekOrThrow(fd, offset); ReadOrThrow(fd, out.get(), size); break; } } // Allocates zeroed memory in to. 
void MapAnonymous(std::size_t size, util::scoped_memory &to) { to.reset(); #if defined(_WIN32) || defined(_WIN64) to.reset(calloc(1, size), size, scoped_memory::MALLOC_ALLOCATED); #else to.reset(MapOrThrow(size, true, # if defined(MAP_ANONYMOUS) MAP_ANONYMOUS | MAP_PRIVATE // Linux # else MAP_ANON | MAP_PRIVATE // BSD # endif , false, -1, 0), size, scoped_memory::MMAP_ALLOCATED); #endif } void *MapZeroedWrite(int fd, std::size_t size) { ResizeOrThrow(fd, 0); ResizeOrThrow(fd, size); return MapOrThrow(size, true, kFileFlags, false, fd, 0); } void *MapZeroedWrite(const char *name, std::size_t size, scoped_fd &file) { file.reset(CreateOrThrow(name)); try { return MapZeroedWrite(file.get(), size); } catch (ErrnoException &e) { e << " in file " << name; throw; } } } // namespace util ================================================ FILE: src/kenlm/util/mmap.hh ================================================ #ifndef UTIL_MMAP__ #define UTIL_MMAP__ // Utilities for mmaped files. #include #include #include namespace util { class scoped_fd; long SizePage(); // (void*)-1 is MAP_FAILED; this is done to avoid including the mmap header here. class scoped_mmap { public: scoped_mmap() : data_((void*)-1), size_(0) {} scoped_mmap(void *data, std::size_t size) : data_(data), size_(size) {} ~scoped_mmap(); void *get() const { return data_; } const uint8_t *begin() const { return reinterpret_cast(data_); } const uint8_t *end() const { return reinterpret_cast(data_) + size_; } std::size_t size() const { return size_; } void reset(void *data, std::size_t size) { scoped_mmap other(data_, size_); data_ = data; size_ = size; } void reset() { reset((void*)-1, 0); } private: void *data_; std::size_t size_; scoped_mmap(const scoped_mmap &); scoped_mmap &operator=(const scoped_mmap &); }; /* For when the memory might come from mmap, new char[], or malloc. Uses NULL * and 0 for blanks even though mmap signals errors with (void*)-1). The reset * function checks that blank for mmap. */ class scoped_memory { public: typedef enum {MMAP_ALLOCATED, ARRAY_ALLOCATED, MALLOC_ALLOCATED, NONE_ALLOCATED} Alloc; scoped_memory() : data_(NULL), size_(0), source_(NONE_ALLOCATED) {} ~scoped_memory() { reset(); } void *get() const { return data_; } const char *begin() const { return reinterpret_cast(data_); } const char *end() const { return reinterpret_cast(data_) + size_; } std::size_t size() const { return size_; } Alloc source() const { return source_; } void reset() { reset(NULL, 0, NONE_ALLOCATED); } void reset(void *data, std::size_t size, Alloc from); // realloc allows the current data to escape hence the need for this call // If realloc fails, destroys the original too and get() returns NULL. void call_realloc(std::size_t to); private: void *data_; std::size_t size_; Alloc source_; scoped_memory(const scoped_memory &); scoped_memory &operator=(const scoped_memory &); }; typedef enum { // mmap with no prepopulate LAZY, // On linux, pass MAP_POPULATE to mmap. POPULATE_OR_LAZY, // Populate on Linux. malloc and read on non-Linux. POPULATE_OR_READ, // malloc and read. READ } LoadMethod; extern const int kFileFlags; // Wrapper around mmap to check it worked and hide some platform macros. void *MapOrThrow(std::size_t size, bool for_write, int flags, bool prefault, int fd, uint64_t offset = 0); void MapRead(LoadMethod method, int fd, uint64_t offset, std::size_t size, scoped_memory &out); void MapAnonymous(std::size_t size, scoped_memory &to); // Open file name with mmap of size bytes, all of which are initially zero. 
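// --------------------------------------------------------------------------
// Illustrative sketch, not part of KenLM: mapping a whole file with the
// helpers declared above.  scoped_memory hides whether the bytes came from
// mmap or from the malloc+read fallback (READ / POPULATE_OR_READ).
#include "util/file.hh"
#include "util/mmap.hh"

void MapWholeFile(const char *name) {
  util::scoped_fd fd(util::OpenReadOrThrow(name));
  uint64_t size = util::SizeOrThrow(fd.get());
  util::scoped_memory region;
  // POPULATE_OR_READ prefaults on Linux and reads the file elsewhere.
  util::MapRead(util::POPULATE_OR_READ, fd.get(), 0,
                static_cast<std::size_t>(size), region);
  // region.begin() .. region.end() now covers the file; unmapped/freed on exit.
}
// --------------------------------------------------------------------------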
void *MapZeroedWrite(int fd, std::size_t size); void *MapZeroedWrite(const char *name, std::size_t size, scoped_fd &file); // msync wrapper void SyncOrThrow(void *start, size_t length); } // namespace util #endif // UTIL_MMAP__ ================================================ FILE: src/kenlm/util/multi_intersection.hh ================================================ #ifndef UTIL_MULTI_INTERSECTION__ #define UTIL_MULTI_INTERSECTION__ #include #include #include #include #include namespace util { namespace detail { template struct RangeLessBySize : public std::binary_function { bool operator()(const Range &left, const Range &right) const { return left.size() < right.size(); } }; /* Takes sets specified by their iterators and a boost::optional containing * the lowest intersection if any. Each set must be sorted in increasing * order. sets is changed to truncate the beginning of each sequence to the * location of the match or an empty set. Precondition: sets is not empty * since the intersection over null is the universe and this function does not * know the universe. */ template boost::optional::value_type> FirstIntersectionSorted(std::vector > &sets, const Less &less = std::less::value_type>()) { typedef std::vector > Sets; typedef typename std::iterator_traits::value_type Value; assert(!sets.empty()); if (sets.front().empty()) return boost::optional(); // Possibly suboptimal to copy for general Value; makes unsigned int go slightly faster. Value highest(sets.front().front()); for (typename Sets::iterator i(sets.begin()); i != sets.end(); ) { i->advance_begin(std::lower_bound(i->begin(), i->end(), highest, less) - i->begin()); if (i->empty()) return boost::optional(); if (less(highest, i->front())) { highest = i->front(); // start over i = sets.begin(); } else { ++i; } } return boost::optional(highest); } } // namespace detail template boost::optional::value_type> FirstIntersection(std::vector > &sets, const Less less) { assert(!sets.empty()); std::sort(sets.begin(), sets.end(), detail::RangeLessBySize >()); return detail::FirstIntersectionSorted(sets, less); } template boost::optional::value_type> FirstIntersection(std::vector > &sets) { return FirstIntersection(sets, std::less::value_type>()); } template void AllIntersection(std::vector > &sets, Output &out, const Less less) { typedef typename std::iterator_traits::value_type Value; assert(!sets.empty()); std::sort(sets.begin(), sets.end(), detail::RangeLessBySize >()); boost::optional ret; for (boost::optional ret; ret = detail::FirstIntersectionSorted(sets, less); sets.front().advance_begin(1)) { out(*ret); } } template void AllIntersection(std::vector > &sets, Output &out) { AllIntersection(sets, out, std::less::value_type>()); } } // namespace util #endif // UTIL_MULTI_INTERSECTION__ ================================================ FILE: src/kenlm/util/multi_intersection_test.cc ================================================ #include "util/multi_intersection.hh" #define BOOST_TEST_MODULE MultiIntersectionTest #include namespace util { namespace { BOOST_AUTO_TEST_CASE(Empty) { std::vector > sets; sets.push_back(boost::iterator_range(static_cast(NULL), static_cast(NULL))); BOOST_CHECK(!FirstIntersection(sets)); } BOOST_AUTO_TEST_CASE(Single) { std::vector nums; nums.push_back(1); nums.push_back(4); nums.push_back(100); std::vector::const_iterator> > sets; sets.push_back(nums); boost::optional ret(FirstIntersection(sets)); BOOST_REQUIRE(ret); BOOST_CHECK_EQUAL(static_cast(1), *ret); } template boost::iterator_range RangeFromArray(const T 
(&arr)[len]) { return boost::iterator_range(arr, arr + len); } BOOST_AUTO_TEST_CASE(MultiNone) { unsigned int nums0[] = {1, 3, 4, 22}; unsigned int nums1[] = {2, 5, 12}; unsigned int nums2[] = {4, 17}; std::vector > sets; sets.push_back(RangeFromArray(nums0)); sets.push_back(RangeFromArray(nums1)); sets.push_back(RangeFromArray(nums2)); BOOST_CHECK(!FirstIntersection(sets)); } BOOST_AUTO_TEST_CASE(MultiOne) { unsigned int nums0[] = {1, 3, 4, 17, 22}; unsigned int nums1[] = {2, 5, 12, 17}; unsigned int nums2[] = {4, 17}; std::vector > sets; sets.push_back(RangeFromArray(nums0)); sets.push_back(RangeFromArray(nums1)); sets.push_back(RangeFromArray(nums2)); boost::optional ret(FirstIntersection(sets)); BOOST_REQUIRE(ret); BOOST_CHECK_EQUAL(static_cast(17), *ret); } } // namespace } // namespace util ================================================ FILE: src/kenlm/util/murmur_hash.cc ================================================ /* Downloaded from http://sites.google.com/site/murmurhash/ which says "All * code is released to the public domain. For business purposes, Murmurhash is * under the MIT license." * This is modified from the original: * ULL tag on 0xc6a4a7935bd1e995 so this will compile on 32-bit. * length changed to unsigned int. * placed in namespace util * add MurmurHashNative * default option = 0 for seed * ARM port from NICT */ #include "util/murmur_hash.hh" #include namespace util { //----------------------------------------------------------------------------- // MurmurHash2, 64-bit versions, by Austin Appleby // The same caveats as 32-bit MurmurHash2 apply here - beware of alignment // and endian-ness issues if used across multiple platforms. // 64-bit hash for 64-bit platforms uint64_t MurmurHash64A ( const void * key, std::size_t len, uint64_t seed ) { const uint64_t m = 0xc6a4a7935bd1e995ULL; const int r = 47; uint64_t h = seed ^ (len * m); #if defined(__arm) || defined(__arm__) const size_t ksize = sizeof(uint64_t); const unsigned char * data = (const unsigned char *)key; const unsigned char * end = data + (std::size_t)(len/8) * ksize; #else const uint64_t * data = (const uint64_t *)key; const uint64_t * end = data + (len/8); #endif while(data != end) { #if defined(__arm) || defined(__arm__) uint64_t k; memcpy(&k, data, ksize); data += ksize; #else uint64_t k = *data++; #endif k *= m; k ^= k >> r; k *= m; h ^= k; h *= m; } const unsigned char * data2 = (const unsigned char*)data; switch(len & 7) { case 7: h ^= uint64_t(data2[6]) << 48; case 6: h ^= uint64_t(data2[5]) << 40; case 5: h ^= uint64_t(data2[4]) << 32; case 4: h ^= uint64_t(data2[3]) << 24; case 3: h ^= uint64_t(data2[2]) << 16; case 2: h ^= uint64_t(data2[1]) << 8; case 1: h ^= uint64_t(data2[0]); h *= m; }; h ^= h >> r; h *= m; h ^= h >> r; return h; } // 64-bit hash for 32-bit platforms uint64_t MurmurHash64B ( const void * key, std::size_t len, uint64_t seed ) { const unsigned int m = 0x5bd1e995; const int r = 24; unsigned int h1 = seed ^ len; unsigned int h2 = 0; #if defined(__arm) || defined(__arm__) size_t ksize = sizeof(unsigned int); const unsigned char * data = (const unsigned char *)key; #else const unsigned int * data = (const unsigned int *)key; #endif unsigned int k1, k2; while(len >= 8) { #if defined(__arm) || defined(__arm__) memcpy(&k1, data, ksize); data += ksize; memcpy(&k2, data, ksize); data += ksize; #else k1 = *data++; k2 = *data++; #endif k1 *= m; k1 ^= k1 >> r; k1 *= m; h1 *= m; h1 ^= k1; len -= 4; k2 *= m; k2 ^= k2 >> r; k2 *= m; h2 *= m; h2 ^= k2; len -= 4; } if(len >= 4) { #if 
defined(__arm) || defined(__arm__) memcpy(&k1, data, ksize); data += ksize; #else k1 = *data++; #endif k1 *= m; k1 ^= k1 >> r; k1 *= m; h1 *= m; h1 ^= k1; len -= 4; } switch(len) { case 3: h2 ^= ((unsigned char*)data)[2] << 16; case 2: h2 ^= ((unsigned char*)data)[1] << 8; case 1: h2 ^= ((unsigned char*)data)[0]; h2 *= m; }; h1 ^= h2 >> 18; h1 *= m; h2 ^= h1 >> 22; h2 *= m; h1 ^= h2 >> 17; h1 *= m; h2 ^= h1 >> 19; h2 *= m; uint64_t h = h1; h = (h << 32) | h2; return h; } // Trick to test for 64-bit architecture at compile time. namespace { template inline uint64_t MurmurHashNativeBackend(const void * key, std::size_t len, uint64_t seed) { return MurmurHash64A(key, len, seed); } template <> inline uint64_t MurmurHashNativeBackend<4>(const void * key, std::size_t len, uint64_t seed) { return MurmurHash64B(key, len, seed); } } // namespace uint64_t MurmurHashNative(const void * key, std::size_t len, uint64_t seed) { return MurmurHashNativeBackend(key, len, seed); } } // namespace util ================================================ FILE: src/kenlm/util/murmur_hash.hh ================================================ #ifndef UTIL_MURMUR_HASH__ #define UTIL_MURMUR_HASH__ #include #include namespace util { uint64_t MurmurHash64A(const void * key, std::size_t len, uint64_t seed = 0); uint64_t MurmurHash64B(const void * key, std::size_t len, uint64_t seed = 0); uint64_t MurmurHashNative(const void * key, std::size_t len, uint64_t seed = 0); } // namespace util #endif // UTIL_MURMUR_HASH__ ================================================ FILE: src/kenlm/util/pcqueue.hh ================================================ #ifndef UTIL_PCQUEUE__ #define UTIL_PCQUEUE__ #include #include #include #include #include namespace util { inline void WaitSemaphore (boost::interprocess::interprocess_semaphore &on) { while (1) { try { on.wait(); break; } catch (boost::interprocess::interprocess_exception &e) { if (e.get_native_error() != EINTR) throw; } } } /* Producer consumer queue safe for multiple producers and multiple consumers. * T must be default constructable and have operator=. * The value is copied twice for Consume(T &out) or three times for Consume(), * so larger objects should be passed via pointer. * Strong exception guarantee if operator= throws. Undefined if semaphores throw. */ template class PCQueue : boost::noncopyable { public: explicit PCQueue(size_t size) : empty_(size), used_(0), storage_(new T[size]), end_(storage_.get() + size), produce_at_(storage_.get()), consume_at_(storage_.get()) {} // Add a value to the queue. void Produce(const T &val) { WaitSemaphore(empty_); { boost::unique_lock produce_lock(produce_at_mutex_); try { *produce_at_ = val; } catch (...) { empty_.post(); throw; } if (++produce_at_ == end_) produce_at_ = storage_.get(); } used_.post(); } // Consume a value, assigning it to out. T& Consume(T &out) { WaitSemaphore(used_); { boost::unique_lock consume_lock(consume_at_mutex_); try { out = *consume_at_; } catch (...) { used_.post(); throw; } if (++consume_at_ == end_) consume_at_ = storage_.get(); } empty_.post(); return out; } // Convenience version of Consume that copies the value to return. // The other version is faster. T Consume() { T ret; Consume(ret); return ret; } private: // Number of empty spaces in storage_. boost::interprocess::interprocess_semaphore empty_; // Number of occupied spaces in storage_. boost::interprocess::interprocess_semaphore used_; boost::scoped_array storage_; T *const end_; // Index for next write in storage_. 
T *produce_at_; boost::mutex produce_at_mutex_; // Index for next read from storage_. T *consume_at_; boost::mutex consume_at_mutex_; }; } // namespace util #endif // UTIL_PCQUEUE__ ================================================ FILE: src/kenlm/util/pool.cc ================================================ #include "util/pool.hh" #include "util/scoped.hh" #include namespace util { Pool::Pool() { current_ = NULL; current_end_ = NULL; } Pool::~Pool() { FreeAll(); } void Pool::FreeAll() { for (std::vector::const_iterator i(free_list_.begin()); i != free_list_.end(); ++i) { free(*i); } free_list_.clear(); current_ = NULL; current_end_ = NULL; } void *Pool::More(std::size_t size) { std::size_t amount = std::max(static_cast(32) << free_list_.size(), size); uint8_t *ret = static_cast(MallocOrThrow(amount)); free_list_.push_back(ret); current_ = ret + size; current_end_ = ret + amount; return ret; } } // namespace util ================================================ FILE: src/kenlm/util/pool.hh ================================================ // Very simple pool. It can only allocate memory. And all of the memory it // allocates must be freed at the same time. #ifndef UTIL_POOL__ #define UTIL_POOL__ #include #include namespace util { class Pool { public: Pool(); ~Pool(); void *Allocate(std::size_t size) { void *ret = current_; current_ += size; if (current_ < current_end_) { return ret; } else { return More(size); } } void FreeAll(); private: void *More(std::size_t size); std::vector free_list_; uint8_t *current_, *current_end_; // no copying Pool(const Pool &); Pool &operator=(const Pool &); }; } // namespace util #endif // UTIL_POOL__ ================================================ FILE: src/kenlm/util/probing_hash_table.hh ================================================ #ifndef UTIL_PROBING_HASH_TABLE__ #define UTIL_PROBING_HASH_TABLE__ #include "util/exception.hh" #include #include #include #include #include #include namespace util { /* Thrown when table grows too large */ class ProbingSizeException : public Exception { public: ProbingSizeException() throw() {} ~ProbingSizeException() throw() {} }; // std::identity is an SGI extension :-( struct IdentityHash { template T operator()(T arg) const { return arg; } }; /* Non-standard hash table * Buckets must be set at the beginning and must be greater than maximum number * of elements, else it throws ProbingSizeException. * Memory management and initialization is externalized to make it easier to * serialize these to disk and load them quickly. * Uses linear probing to find value. * Only insert and lookup operations. */ template > class ProbingHashTable { public: typedef EntryT Entry; typedef typename Entry::Key Key; typedef const Entry *ConstIterator; typedef Entry *MutableIterator; typedef HashT Hash; typedef EqualT Equal; public: static uint64_t Size(uint64_t entries, float multiplier) { uint64_t buckets = std::max(entries + 1, static_cast(multiplier * static_cast(entries))); return buckets * sizeof(Entry); } // Must be assigned to later. 
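// (A default-constructed table owns no buckets; callers typically allocate
// Size()-many bytes externally, construct a table over that memory, and
// assign it over this placeholder.)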
ProbingHashTable() : entries_(0) #ifdef DEBUG , initialized_(false) #endif {} ProbingHashTable(void *start, std::size_t allocated, const Key &invalid = Key(), const Hash &hash_func = Hash(), const Equal &equal_func = Equal()) : begin_(reinterpret_cast(start)), buckets_(allocated / sizeof(Entry)), end_(begin_ + buckets_), invalid_(invalid), hash_(hash_func), equal_(equal_func), entries_(0) #ifdef DEBUG , initialized_(true) #endif {} template MutableIterator Insert(const T &t) { #ifdef DEBUG assert(initialized_); #endif UTIL_THROW_IF(++entries_ >= buckets_, ProbingSizeException, "Hash table with " << buckets_ << " buckets is full."); return UncheckedInsert(t); } // Return true if the value was found (and not inserted). This is consistent with Find but the opposite if hash_map! template bool FindOrInsert(const T &t, MutableIterator &out) { #ifdef DEBUG assert(initialized_); #endif for (MutableIterator i(begin_ + (hash_(t.GetKey()) % buckets_));;) { Key got(i->GetKey()); if (equal_(got, t.GetKey())) { out = i; return true; } if (equal_(got, invalid_)) { UTIL_THROW_IF(++entries_ >= buckets_, ProbingSizeException, "Hash table with " << buckets_ << " buckets is full."); *i = t; out = i; return false; } if (++i == end_) i = begin_; } } void FinishedInserting() {} void LoadedBinary() {} // Don't change anything related to GetKey, template bool UnsafeMutableFind(const Key key, MutableIterator &out) { #ifdef DEBUG assert(initialized_); #endif for (MutableIterator i(begin_ + (hash_(key) % buckets_));;) { Key got(i->GetKey()); if (equal_(got, key)) { out = i; return true; } if (equal_(got, invalid_)) return false; if (++i == end_) i = begin_; } } template bool Find(const Key key, ConstIterator &out) const { #ifdef DEBUG assert(initialized_); #endif for (ConstIterator i(begin_ + (hash_(key) % buckets_));;) { Key got(i->GetKey()); if (equal_(got, key)) { out = i; return true; } if (equal_(got, invalid_)) return false; if (++i == end_) i = begin_; } } void Clear() { Entry invalid; invalid.SetKey(invalid_); std::fill(begin_, end_, invalid); entries_ = 0; } // Return number of entries assuming no serialization went on. std::size_t SizeNoSerialization() const { return entries_; } // Return memory size expected by Double. std::size_t DoubleTo() const { return buckets_ * 2 * sizeof(Entry); } // Inform the table that it has double the amount of memory. // Pass clear_new = false if you are sure the new memory is initialized // properly (to invalid_) i.e. by mremap. void Double(void *new_base, bool clear_new = true) { begin_ = static_cast(new_base); MutableIterator old_end = begin_ + buckets_; buckets_ *= 2; end_ = begin_ + buckets_; if (clear_new) { Entry invalid; invalid.SetKey(invalid_); std::fill(old_end, end_, invalid); } std::vector rolled_over; // Move roll-over entries to a buffer because they might not roll over anymore. This should be small. for (MutableIterator i = begin_; i != old_end && !equal_(i->GetKey(), invalid_); ++i) { rolled_over.push_back(*i); i->SetKey(invalid_); } /* Re-insert everything. Entries might go backwards to take over a * recently opened gap, stay, move to new territory, or wrap around. If * an entry wraps around, it might go to a pointer greater than i (which * can happen at the beginning) and it will be revisited to possibly fill * in a gap created later. */ Entry temp; for (MutableIterator i = begin_; i != old_end; ++i) { if (!equal_(i->GetKey(), invalid_)) { temp = *i; i->SetKey(invalid_); UncheckedInsert(temp); } } // Put the roll-over entries back in. 
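// (Reinsertion order does not matter: UncheckedInsert probes from each
// entry's ideal bucket, so the buffered entries land in whatever gaps remain.)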
for (typename std::vector::const_iterator i(rolled_over.begin()); i != rolled_over.end(); ++i) { UncheckedInsert(*i); } } // Mostly for tests, check consistency of every entry. void CheckConsistency() { MutableIterator last; for (last = end_ - 1; last >= begin_ && !equal_(last->GetKey(), invalid_); --last) {} UTIL_THROW_IF(last == begin_, ProbingSizeException, "Completely full"); MutableIterator i; // Beginning can be wrap-arounds. for (i = begin_; !equal_(i->GetKey(), invalid_); ++i) { MutableIterator ideal = Ideal(*i); UTIL_THROW_IF(ideal > i && ideal <= last, Exception, "Inconsistency at position " << (i - begin_) << " should be at " << (ideal - begin_)); } MutableIterator pre_gap = i; for (; i != end_; ++i) { if (equal_(i->GetKey(), invalid_)) { pre_gap = i; continue; } MutableIterator ideal = Ideal(*i); UTIL_THROW_IF(ideal > i || ideal <= pre_gap, Exception, "Inconsistency at position " << (i - begin_) << " with ideal " << (ideal - begin_)); } } private: template MutableIterator Ideal(const T &t) { return begin_ + (hash_(t.GetKey()) % buckets_); } template MutableIterator UncheckedInsert(const T &t) { for (MutableIterator i(Ideal(t));;) { if (equal_(i->GetKey(), invalid_)) { *i = t; return i; } if (++i == end_) { i = begin_; } } } MutableIterator begin_; std::size_t buckets_; MutableIterator end_; Key invalid_; Hash hash_; Equal equal_; std::size_t entries_; #ifdef DEBUG bool initialized_; #endif }; } // namespace util #endif // UTIL_PROBING_HASH_TABLE__ ================================================ FILE: src/kenlm/util/probing_hash_table_test.cc ================================================ #include "util/probing_hash_table.hh" #include "util/murmur_hash.hh" #include "util/scoped.hh" #define BOOST_TEST_MODULE ProbingHashTableTest #include #include #include #include #include #include #include namespace util { namespace { struct Entry { unsigned char key; typedef unsigned char Key; unsigned char GetKey() const { return key; } void SetKey(unsigned char to) { key = to; } uint64_t GetValue() const { return value; } uint64_t value; }; typedef ProbingHashTable > Table; BOOST_AUTO_TEST_CASE(simple) { size_t size = Table::Size(10, 1.2); boost::scoped_array mem(new char[size]); memset(mem.get(), 0, size); Table table(mem.get(), size); const Entry *i = NULL; BOOST_CHECK(!table.Find(2, i)); Entry to_ins; to_ins.key = 3; to_ins.value = 328920; table.Insert(to_ins); BOOST_REQUIRE(table.Find(3, i)); BOOST_CHECK_EQUAL(3, i->GetKey()); BOOST_CHECK_EQUAL(static_cast(328920), i->GetValue()); BOOST_CHECK(!table.Find(2, i)); } struct Entry64 { uint64_t key; typedef uint64_t Key; Entry64() {} explicit Entry64(uint64_t key_in) { key = key_in; } Key GetKey() const { return key; } void SetKey(uint64_t to) { key = to; } }; struct MurmurHashEntry64 { std::size_t operator()(uint64_t value) const { return util::MurmurHash64A(&value, 8); } }; typedef ProbingHashTable Table64; BOOST_AUTO_TEST_CASE(Double) { for (std::size_t initial = 19; initial < 30; ++initial) { size_t size = Table64::Size(initial, 1.2); scoped_malloc mem(MallocOrThrow(size)); Table64 table(mem.get(), size, std::numeric_limits::max()); table.Clear(); for (uint64_t i = 0; i < 19; ++i) { table.Insert(Entry64(i)); } table.CheckConsistency(); mem.call_realloc(table.DoubleTo()); table.Double(mem.get()); table.CheckConsistency(); for (uint64_t i = 20; i < 40 ; ++i) { table.Insert(Entry64(i)); } mem.call_realloc(table.DoubleTo()); table.Double(mem.get()); table.CheckConsistency(); } } } // namespace } // namespace util 
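Below is a minimal usage sketch for ProbingHashTable, modeled on the "simple" test case just shown. The DemoEntry type, the key/value numbers, and the 1.5 load multiplier are illustrative choices rather than anything mandated by the header, which only requires a nested Key typedef plus GetKey/SetKey accessors.

#include "util/probing_hash_table.hh"

#include <cstddef>
#include <iostream>
#include <vector>

namespace {
// Entry layout is caller-defined; the table never allocates or owns memory.
struct DemoEntry {
  typedef unsigned char Key;
  unsigned char key;
  int value;
  unsigned char GetKey() const { return key; }
  void SetKey(unsigned char to) { key = to; }
};
} // namespace

int main() {
  typedef util::ProbingHashTable<DemoEntry, util::IdentityHash> Table;
  // Size() reports the bytes needed for the requested entry count and load multiplier.
  const std::size_t bytes = Table::Size(10, 1.5);
  std::vector<char> backing(bytes, 0);   // zeroed, so Key() == 0 marks empty buckets
  Table table(&backing[0], bytes);

  DemoEntry entry;
  entry.key = 3;        // must differ from the invalid key (0 here)
  entry.value = 42;
  table.Insert(entry);

  const DemoEntry *found;
  if (table.Find(3, found)) {
    std::cout << "key 3 -> " << found->value << '\n';   // prints 42
  }
  return 0;
}

Because the table never allocates, the caller can place it over mmapped or serialized memory and later grow it in place with DoubleTo()/Double(), which is the point of externalizing memory management noted in the header comment.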
================================================ FILE: src/kenlm/util/proxy_iterator.hh ================================================ #ifndef UTIL_PROXY_ITERATOR__ #define UTIL_PROXY_ITERATOR__ #include #include /* This is a RandomAccessIterator that uses a proxy to access the underlying * data. Useful for packing data at bit offsets but still using STL * algorithms. * * Normally I would use boost::iterator_facade but some people are too lazy to * install boost and still want to use my language model. It's amazing how * many operators an iterator has. * * The Proxy needs to provide: * class InnerIterator; * InnerIterator &Inner(); * const InnerIterator &Inner() const; * * InnerIterator has to implement: * operator==(InnerIterator) * operator<(InnerIterator) * operator+=(std::ptrdiff_t) * operator-(InnerIterator) * and of course whatever Proxy needs to dereference it. * * It's also a good idea to specialize std::swap for Proxy. */ namespace util { template class ProxyIterator { private: // Self. typedef ProxyIterator S; typedef typename Proxy::InnerIterator InnerIterator; public: typedef std::random_access_iterator_tag iterator_category; typedef typename Proxy::value_type value_type; typedef std::ptrdiff_t difference_type; typedef Proxy reference; typedef Proxy * pointer; ProxyIterator() {} // For cast from non const to const. template ProxyIterator(const ProxyIterator &in) : p_(*in) {} explicit ProxyIterator(const Proxy &p) : p_(p) {} // p_'s operator= does value copying, but here we want iterator copying. S &operator=(const S &other) { I() = other.I(); return *this; } bool operator==(const S &other) const { return I() == other.I(); } bool operator!=(const S &other) const { return !(*this == other); } bool operator<(const S &other) const { return I() < other.I(); } bool operator>(const S &other) const { return other < *this; } bool operator<=(const S &other) const { return !(*this > other); } bool operator>=(const S &other) const { return !(*this < other); } S &operator++() { return *this += 1; } S operator++(int) { S ret(*this); ++*this; return ret; } S &operator+=(std::ptrdiff_t amount) { I() += amount; return *this; } S operator+(std::ptrdiff_t amount) const { S ret(*this); ret += amount; return ret; } S &operator--() { return *this -= 1; } S operator--(int) { S ret(*this); --*this; return ret; } S &operator-=(std::ptrdiff_t amount) { I() += (-amount); return *this; } S operator-(std::ptrdiff_t amount) const { S ret(*this); ret -= amount; return ret; } std::ptrdiff_t operator-(const S &other) const { return I() - other.I(); } Proxy operator*() { return p_; } const Proxy operator*() const { return p_; } Proxy *operator->() { return &p_; } const Proxy *operator->() const { return &p_; } Proxy operator[](std::ptrdiff_t amount) const { return *(*this + amount); } const InnerIterator &Inner() { return p_.Inner(); } private: InnerIterator &I() { return p_.Inner(); } const InnerIterator &I() const { return p_.Inner(); } Proxy p_; }; template ProxyIterator operator+(std::ptrdiff_t amount, const ProxyIterator &it) { return it + amount; } } // namespace util #endif // UTIL_PROXY_ITERATOR__ ================================================ FILE: src/kenlm/util/read_compressed.cc ================================================ #include "util/read_compressed.hh" #include "util/file.hh" #include "util/have.hh" #include "util/scoped.hh" #include #include #include #include #include #include #ifdef HAVE_ZLIB #include #endif #ifdef HAVE_BZLIB #include #endif #ifdef HAVE_XZLIB #include #endif namespace 
util { CompressedException::CompressedException() throw() {} CompressedException::~CompressedException() throw() {} GZException::GZException() throw() {} GZException::~GZException() throw() {} BZException::BZException() throw() {} BZException::~BZException() throw() {} XZException::XZException() throw() {} XZException::~XZException() throw() {} class ReadBase { public: virtual ~ReadBase() {} virtual std::size_t Read(void *to, std::size_t amount, ReadCompressed &thunk) = 0; protected: static void ReplaceThis(ReadBase *with, ReadCompressed &thunk) { thunk.internal_.reset(with); } static uint64_t &ReadCount(ReadCompressed &thunk) { return thunk.raw_amount_; } }; namespace { // Completed file that other classes can thunk to. class Complete : public ReadBase { public: std::size_t Read(void *, std::size_t, ReadCompressed &) { return 0; } }; class Uncompressed : public ReadBase { public: explicit Uncompressed(int fd) : fd_(fd) {} std::size_t Read(void *to, std::size_t amount, ReadCompressed &thunk) { std::size_t got = PartialRead(fd_.get(), to, amount); ReadCount(thunk) += got; return got; } private: scoped_fd fd_; }; class UncompressedWithHeader : public ReadBase { public: UncompressedWithHeader(int fd, void *already_data, std::size_t already_size) : fd_(fd) { assert(already_size); buf_.reset(malloc(already_size)); if (!buf_.get()) throw std::bad_alloc(); memcpy(buf_.get(), already_data, already_size); remain_ = static_cast(buf_.get()); end_ = remain_ + already_size; } std::size_t Read(void *to, std::size_t amount, ReadCompressed &thunk) { assert(buf_.get()); std::size_t sending = std::min(amount, end_ - remain_); memcpy(to, remain_, sending); remain_ += sending; if (remain_ == end_) { ReplaceThis(new Uncompressed(fd_.release()), thunk); } return sending; } private: scoped_malloc buf_; uint8_t *remain_; uint8_t *end_; scoped_fd fd_; }; #ifdef HAVE_ZLIB class GZip : public ReadBase { private: static const std::size_t kInputBuffer = 16384; public: GZip(int fd, void *already_data, std::size_t already_size) : file_(fd), in_buffer_(malloc(kInputBuffer)) { if (!in_buffer_.get()) throw std::bad_alloc(); assert(already_size < kInputBuffer); if (already_size) { memcpy(in_buffer_.get(), already_data, already_size); stream_.next_in = static_cast(in_buffer_.get()); stream_.avail_in = already_size; stream_.avail_in += ReadOrEOF(file_.get(), static_cast(in_buffer_.get()) + already_size, kInputBuffer - already_size); } else { stream_.avail_in = 0; } stream_.zalloc = Z_NULL; stream_.zfree = Z_NULL; stream_.opaque = Z_NULL; stream_.msg = NULL; // 32 for zlib and gzip decoding with automatic header detection. // 15 for maximum window size. UTIL_THROW_IF(Z_OK != inflateInit2(&stream_, 32 + 15), GZException, "Failed to initialize zlib."); } ~GZip() { if (Z_OK != inflateEnd(&stream_)) { std::cerr << "zlib could not close properly." << std::endl; abort(); } } std::size_t Read(void *to, std::size_t amount, ReadCompressed &thunk) { if (amount == 0) return 0; stream_.next_out = static_cast(to); stream_.avail_out = std::min(std::numeric_limits::max(), amount); do { if (!stream_.avail_in) ReadInput(thunk); int result = inflate(&stream_, 0); switch (result) { case Z_OK: break; case Z_STREAM_END: { std::size_t ret = static_cast(stream_.next_out) - static_cast(to); ReplaceThis(new Complete(), thunk); return ret; } case Z_ERRNO: UTIL_THROW(ErrnoException, "zlib error"); default: UTIL_THROW(GZException, "zlib encountered " << (stream_.msg ? 
stream_.msg : "an error ") << " code " << result); } } while (stream_.next_out == to); return static_cast(stream_.next_out) - static_cast(to); } private: void ReadInput(ReadCompressed &thunk) { assert(!stream_.avail_in); stream_.next_in = static_cast(in_buffer_.get()); stream_.avail_in = ReadOrEOF(file_.get(), in_buffer_.get(), kInputBuffer); ReadCount(thunk) += stream_.avail_in; } scoped_fd file_; scoped_malloc in_buffer_; z_stream stream_; }; #endif // HAVE_ZLIB #ifdef HAVE_BZLIB class BZip : public ReadBase { public: explicit BZip(int fd, void *already_data, std::size_t already_size) { scoped_fd hold(fd); closer_.reset(FDOpenReadOrThrow(hold)); int bzerror = BZ_OK; file_ = BZ2_bzReadOpen(&bzerror, closer_.get(), 0, 0, already_data, already_size); switch (bzerror) { case BZ_OK: return; case BZ_CONFIG_ERROR: UTIL_THROW(BZException, "Looks like bzip2 was miscompiled."); case BZ_PARAM_ERROR: UTIL_THROW(BZException, "Parameter error"); case BZ_IO_ERROR: UTIL_THROW(BZException, "IO error reading file"); case BZ_MEM_ERROR: throw std::bad_alloc(); } } ~BZip() { int bzerror = BZ_OK; BZ2_bzReadClose(&bzerror, file_); if (bzerror != BZ_OK) { std::cerr << "bz2 readclose error" << std::endl; abort(); } } std::size_t Read(void *to, std::size_t amount, ReadCompressed &thunk) { int bzerror = BZ_OK; int ret = BZ2_bzRead(&bzerror, file_, to, std::min(static_cast(INT_MAX), amount)); long pos; switch (bzerror) { case BZ_STREAM_END: pos = ftell(closer_.get()); if (pos != -1) ReadCount(thunk) = pos; ReplaceThis(new Complete(), thunk); return ret; case BZ_OK: pos = ftell(closer_.get()); if (pos != -1) ReadCount(thunk) = pos; return ret; default: UTIL_THROW(BZException, "bzip2 error " << BZ2_bzerror(file_, &bzerror) << " code " << bzerror); } } private: scoped_FILE closer_; BZFILE *file_; }; #endif // HAVE_BZLIB #ifdef HAVE_XZLIB class XZip : public ReadBase { private: static const std::size_t kInputBuffer = 16384; public: XZip(int fd, void *already_data, std::size_t already_size) : file_(fd), in_buffer_(malloc(kInputBuffer)), stream_(), action_(LZMA_RUN) { if (!in_buffer_.get()) throw std::bad_alloc(); assert(already_size < kInputBuffer); if (already_size) { memcpy(in_buffer_.get(), already_data, already_size); stream_.next_in = static_cast(in_buffer_.get()); stream_.avail_in = already_size; stream_.avail_in += ReadOrEOF(file_.get(), static_cast(in_buffer_.get()) + already_size, kInputBuffer - already_size); } else { stream_.avail_in = 0; } stream_.allocator = NULL; lzma_ret ret = lzma_stream_decoder(&stream_, UINT64_MAX, LZMA_CONCATENATED); switch (ret) { case LZMA_OK: break; case LZMA_MEM_ERROR: UTIL_THROW(ErrnoException, "xz open error"); default: UTIL_THROW(XZException, "xz error code " << ret); } } ~XZip() { lzma_end(&stream_); } std::size_t Read(void *to, std::size_t amount, ReadCompressed &thunk) { if (amount == 0) return 0; stream_.next_out = static_cast(to); stream_.avail_out = amount; do { if (!stream_.avail_in) ReadInput(thunk); lzma_ret status = lzma_code(&stream_, action_); switch (status) { case LZMA_OK: break; case LZMA_STREAM_END: UTIL_THROW_IF(action_ != LZMA_FINISH, XZException, "Input not finished yet."); { std::size_t ret = static_cast(stream_.next_out) - static_cast(to); ReplaceThis(new Complete(), thunk); return ret; } case LZMA_MEM_ERROR: throw std::bad_alloc(); case LZMA_FORMAT_ERROR: UTIL_THROW(XZException, "xzlib says file format not recognized"); case LZMA_OPTIONS_ERROR: UTIL_THROW(XZException, "xzlib says unsupported compression options"); case LZMA_DATA_ERROR: 
UTIL_THROW(XZException, "xzlib says this file is corrupt"); case LZMA_BUF_ERROR: UTIL_THROW(XZException, "xzlib says unexpected end of input"); default: UTIL_THROW(XZException, "unrecognized xzlib error " << status); } } while (stream_.next_out == to); return static_cast(stream_.next_out) - static_cast(to); } private: void ReadInput(ReadCompressed &thunk) { assert(!stream_.avail_in); stream_.next_in = static_cast(in_buffer_.get()); stream_.avail_in = ReadOrEOF(file_.get(), in_buffer_.get(), kInputBuffer); if (!stream_.avail_in) action_ = LZMA_FINISH; ReadCount(thunk) += stream_.avail_in; } scoped_fd file_; scoped_malloc in_buffer_; lzma_stream stream_; lzma_action action_; }; #endif // HAVE_XZLIB class IStreamReader : public ReadBase { public: explicit IStreamReader(std::istream &stream) : stream_(stream) {} std::size_t Read(void *to, std::size_t amount, ReadCompressed &thunk) { if (!stream_.read(static_cast(to), amount)) { UTIL_THROW_IF(!stream_.eof(), ErrnoException, "istream error"); amount = stream_.gcount(); } ReadCount(thunk) += amount; return amount; } private: std::istream &stream_; }; enum MagicResult { UNKNOWN, GZIP, BZIP, XZIP }; MagicResult DetectMagic(const void *from_void) { const uint8_t *header = static_cast(from_void); if (header[0] == 0x1f && header[1] == 0x8b) { return GZIP; } if (header[0] == 'B' && header[1] == 'Z' && header[2] == 'h') { return BZIP; } const uint8_t xzmagic[6] = { 0xFD, '7', 'z', 'X', 'Z', 0x00 }; if (!memcmp(header, xzmagic, 6)) { return XZIP; } return UNKNOWN; } ReadBase *ReadFactory(int fd, uint64_t &raw_amount) { scoped_fd hold(fd); unsigned char header[ReadCompressed::kMagicSize]; raw_amount = ReadOrEOF(fd, header, ReadCompressed::kMagicSize); if (!raw_amount) return new Uncompressed(hold.release()); if (raw_amount != ReadCompressed::kMagicSize) return new UncompressedWithHeader(hold.release(), header, raw_amount); switch (DetectMagic(header)) { case GZIP: #ifdef HAVE_ZLIB return new GZip(hold.release(), header, ReadCompressed::kMagicSize); #else UTIL_THROW(CompressedException, "This looks like a gzip file but gzip support was not compiled in."); #endif case BZIP: #ifdef HAVE_BZLIB return new BZip(hold.release(), header, ReadCompressed::kMagicSize); #else UTIL_THROW(CompressedException, "This looks like a bzip file (it begins with BZ), but bzip support was not compiled in."); #endif case XZIP: #ifdef HAVE_XZLIB return new XZip(hold.release(), header, ReadCompressed::kMagicSize); #else UTIL_THROW(CompressedException, "This looks like an xz file, but xz support was not compiled in."); #endif case UNKNOWN: break; } try { SeekOrThrow(fd, 0); } catch (const util::ErrnoException &e) { return new UncompressedWithHeader(hold.release(), header, ReadCompressed::kMagicSize); } return new Uncompressed(hold.release()); } } // namespace bool ReadCompressed::DetectCompressedMagic(const void *from_void) { return DetectMagic(from_void) != UNKNOWN; } ReadCompressed::ReadCompressed(int fd) { Reset(fd); } ReadCompressed::ReadCompressed(std::istream &in) { Reset(in); } ReadCompressed::ReadCompressed() {} ReadCompressed::~ReadCompressed() {} void ReadCompressed::Reset(int fd) { internal_.reset(); internal_.reset(ReadFactory(fd, raw_amount_)); } void ReadCompressed::Reset(std::istream &in) { internal_.reset(); internal_.reset(new IStreamReader(in)); } std::size_t ReadCompressed::Read(void *to, std::size_t amount) { return internal_->Read(to, amount, *this); } } // namespace util ================================================ FILE: src/kenlm/util/read_compressed.hh 
================================================ #ifndef UTIL_READ_COMPRESSED__ #define UTIL_READ_COMPRESSED__ #include "util/exception.hh" #include "util/scoped.hh" #include #include namespace util { class CompressedException : public Exception { public: CompressedException() throw(); virtual ~CompressedException() throw(); }; class GZException : public CompressedException { public: GZException() throw(); ~GZException() throw(); }; class BZException : public CompressedException { public: BZException() throw(); ~BZException() throw(); }; class XZException : public CompressedException { public: XZException() throw(); ~XZException() throw(); }; class ReadBase; class ReadCompressed { public: static const std::size_t kMagicSize = 6; // Must have at least kMagicSize bytes. static bool DetectCompressedMagic(const void *from); // Takes ownership of fd. explicit ReadCompressed(int fd); // Try to avoid using this. Use the fd instead. // There is no decompression support for istreams. explicit ReadCompressed(std::istream &in); // Must call Reset later. ReadCompressed(); ~ReadCompressed(); // Takes ownership of fd. void Reset(int fd); // Same advice as the constructor. void Reset(std::istream &in); std::size_t Read(void *to, std::size_t amount); uint64_t RawAmount() const { return raw_amount_; } private: friend class ReadBase; scoped_ptr internal_; uint64_t raw_amount_; // No copying. ReadCompressed(const ReadCompressed &); void operator=(const ReadCompressed &); }; } // namespace util #endif // UTIL_READ_COMPRESSED__ ================================================ FILE: src/kenlm/util/read_compressed_test.cc ================================================ #include "util/read_compressed.hh" #include "util/file.hh" #include "util/have.hh" #define BOOST_TEST_MODULE ReadCompressedTest #include #include #include #include #include namespace util { namespace { void ReadLoop(ReadCompressed &reader, void *to_void, std::size_t amount) { uint8_t *to = static_cast(to_void); while (amount) { std::size_t ret = reader.Read(to, amount); BOOST_REQUIRE(ret); to += ret; amount -= ret; } } const uint32_t kSize4 = 100000 / 4; std::string WriteRandom() { char name[] = "tempXXXXXX"; scoped_fd original(mkstemp(name)); BOOST_REQUIRE(original.get() > 0); for (uint32_t i = 0; i < kSize4; ++i) { WriteOrThrow(original.get(), &i, sizeof(uint32_t)); } return name; } void VerifyRead(ReadCompressed &reader) { for (uint32_t i = 0; i < kSize4; ++i) { uint32_t got; ReadLoop(reader, &got, sizeof(uint32_t)); BOOST_CHECK_EQUAL(i, got); } char ignored; BOOST_CHECK_EQUAL((std::size_t)0, reader.Read(&ignored, 1)); // Test double EOF call. 
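// (For the compressed readers this works because the Complete handler has been
// swapped in at stream end; for plain file descriptors the underlying read
// simply keeps returning 0.)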
BOOST_CHECK_EQUAL((std::size_t)0, reader.Read(&ignored, 1)); } void TestRandom(const char *compressor) { std::string name(WriteRandom()); char gzname[] = "tempXXXXXX"; scoped_fd gzipped(mkstemp(gzname)); std::string command(compressor); #ifdef __CYGWIN__ command += ".exe"; #endif command += " <\""; command += name; command += "\" >\""; command += gzname; command += "\""; BOOST_REQUIRE_EQUAL(0, system(command.c_str())); BOOST_CHECK_EQUAL(0, unlink(name.c_str())); BOOST_CHECK_EQUAL(0, unlink(gzname)); ReadCompressed reader(gzipped.release()); VerifyRead(reader); } BOOST_AUTO_TEST_CASE(Uncompressed) { TestRandom("cat"); } #ifdef HAVE_ZLIB BOOST_AUTO_TEST_CASE(ReadGZ) { TestRandom("gzip"); } #endif // HAVE_ZLIB #ifdef HAVE_BZLIB BOOST_AUTO_TEST_CASE(ReadBZ) { TestRandom("bzip2"); } #endif // HAVE_BZLIB #ifdef HAVE_XZLIB BOOST_AUTO_TEST_CASE(ReadXZ) { TestRandom("xz"); } #endif BOOST_AUTO_TEST_CASE(IStream) { std::string name(WriteRandom()); std::fstream stream(name.c_str(), std::ios::in); BOOST_CHECK_EQUAL(0, unlink(name.c_str())); ReadCompressed reader; reader.Reset(stream); VerifyRead(reader); } } // namespace } // namespace util ================================================ FILE: src/kenlm/util/scoped.cc ================================================ #include "util/scoped.hh" #include #if !defined(_WIN32) && !defined(_WIN64) #include #endif namespace util { MallocException::MallocException(std::size_t requested) throw() { *this << "for " << requested << " bytes "; } MallocException::~MallocException() throw() {} namespace { void *InspectAddr(void *addr, std::size_t requested, const char *func_name) { UTIL_THROW_IF_ARG(!addr && requested, MallocException, (requested), "in " << func_name); // These routines are often used for large chunks of memory where huge pages help. #if MADV_HUGEPAGE madvise(addr, requested, MADV_HUGEPAGE); #endif return addr; } } // namespace void *MallocOrThrow(std::size_t requested) { return InspectAddr(std::malloc(requested), requested, "malloc"); } void *CallocOrThrow(std::size_t requested) { return InspectAddr(std::calloc(1, requested), requested, "calloc"); } scoped_malloc::~scoped_malloc() { std::free(p_); } void scoped_malloc::call_realloc(std::size_t requested) { p_ = InspectAddr(std::realloc(p_, requested), requested, "realloc"); } } // namespace util ================================================ FILE: src/kenlm/util/scoped.hh ================================================ #ifndef UTIL_SCOPED__ #define UTIL_SCOPED__ /* Other scoped objects in the style of scoped_ptr. */ #include "util/exception.hh" #include namespace util { class MallocException : public ErrnoException { public: explicit MallocException(std::size_t requested) throw(); ~MallocException() throw(); }; void *MallocOrThrow(std::size_t requested); void *CallocOrThrow(std::size_t requested); class scoped_malloc { public: scoped_malloc() : p_(NULL) {} scoped_malloc(void *p) : p_(p) {} ~scoped_malloc(); void reset(void *p = NULL) { scoped_malloc other(p_); p_ = p; } void call_realloc(std::size_t to); void *get() { return p_; } const void *get() const { return p_; } private: void *p_; scoped_malloc(const scoped_malloc &); scoped_malloc &operator=(const scoped_malloc &); }; // Hat tip to boost. 
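// The two templates below mirror boost::scoped_array and boost::scoped_ptr:
// single-owner, non-copyable RAII holders whose destructors call delete[] and
// delete respectively.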
template class scoped_array { public: explicit scoped_array(T *content = NULL) : c_(content) {} ~scoped_array() { delete [] c_; } T *get() { return c_; } const T* get() const { return c_; } T &operator*() { return *c_; } const T&operator*() const { return *c_; } T &operator[](std::size_t idx) { return c_[idx]; } const T &operator[](std::size_t idx) const { return c_[idx]; } void reset(T *to = NULL) { scoped_array other(c_); c_ = to; } private: T *c_; scoped_array(const scoped_array &); void operator=(const scoped_array &); }; template class scoped_ptr { public: explicit scoped_ptr(T *content = NULL) : c_(content) {} ~scoped_ptr() { delete c_; } T *get() { return c_; } const T* get() const { return c_; } T &operator*() { return *c_; } const T&operator*() const { return *c_; } T *operator->() { return c_; } const T*operator->() const { return c_; } T &operator[](std::size_t idx) { return c_[idx]; } const T &operator[](std::size_t idx) const { return c_[idx]; } void reset(T *to = NULL) { scoped_ptr other(c_); c_ = to; } private: T *c_; scoped_ptr(const scoped_ptr &); void operator=(const scoped_ptr &); }; } // namespace util #endif // UTIL_SCOPED__ ================================================ FILE: src/kenlm/util/sized_iterator.hh ================================================ #ifndef UTIL_SIZED_ITERATOR__ #define UTIL_SIZED_ITERATOR__ #include "util/proxy_iterator.hh" #include #include #include #include namespace util { class SizedInnerIterator { public: SizedInnerIterator() {} SizedInnerIterator(void *ptr, std::size_t size) : ptr_(static_cast(ptr)), size_(size) {} bool operator==(const SizedInnerIterator &other) const { return ptr_ == other.ptr_; } bool operator<(const SizedInnerIterator &other) const { return ptr_ < other.ptr_; } SizedInnerIterator &operator+=(std::ptrdiff_t amount) { ptr_ += amount * size_; return *this; } std::ptrdiff_t operator-(const SizedInnerIterator &other) const { return (ptr_ - other.ptr_) / size_; } const void *Data() const { return ptr_; } void *Data() { return ptr_; } std::size_t EntrySize() const { return size_; } private: uint8_t *ptr_; std::size_t size_; }; class SizedProxy { public: SizedProxy() {} SizedProxy(void *ptr, std::size_t size) : inner_(ptr, size) {} operator std::string() const { return std::string(reinterpret_cast(inner_.Data()), inner_.EntrySize()); } SizedProxy &operator=(const SizedProxy &from) { memcpy(inner_.Data(), from.inner_.Data(), inner_.EntrySize()); return *this; } SizedProxy &operator=(const std::string &from) { memcpy(inner_.Data(), from.data(), inner_.EntrySize()); return *this; } const void *Data() const { return inner_.Data(); } void *Data() { return inner_.Data(); } private: friend class util::ProxyIterator; typedef std::string value_type; typedef SizedInnerIterator InnerIterator; InnerIterator &Inner() { return inner_; } const InnerIterator &Inner() const { return inner_; } InnerIterator inner_; }; typedef ProxyIterator SizedIterator; inline SizedIterator SizedIt(void *ptr, std::size_t size) { return SizedIterator(SizedProxy(ptr, size)); } // Useful wrapper for a comparison function i.e. sort. 
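// (SizedCompare forwards to a delegate that compares the records via their raw
// data pointers, and accepts both SizedProxy and std::string arguments so it
// can be handed directly to std::sort over SizedIterator ranges.)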
template class SizedCompare : public std::binary_function { public: explicit SizedCompare(const Delegate &delegate = Delegate()) : delegate_(delegate) {} bool operator()(const Proxy &first, const Proxy &second) const { return delegate_(first.Data(), second.Data()); } bool operator()(const Proxy &first, const std::string &second) const { return delegate_(first.Data(), second.data()); } bool operator()(const std::string &first, const Proxy &second) const { return delegate_(first.data(), second.Data()); } bool operator()(const std::string &first, const std::string &second) const { return delegate_(first.data(), second.data()); } const Delegate &GetDelegate() const { return delegate_; } private: const Delegate delegate_; }; } // namespace util #endif // UTIL_SIZED_ITERATOR__ ================================================ FILE: src/kenlm/util/sorted_uniform.hh ================================================ #ifndef UTIL_SORTED_UNIFORM__ #define UTIL_SORTED_UNIFORM__ #include #include #include #include namespace util { template class IdentityAccessor { public: typedef T Key; T operator()(const T *in) const { return *in; } }; struct Pivot64 { static inline std::size_t Calc(uint64_t off, uint64_t range, std::size_t width) { std::size_t ret = static_cast(static_cast(off) / static_cast(range) * static_cast(width)); // Cap for floating point rounding return (ret < width) ? ret : width - 1; } }; // Use when off * width is <2^64. This is guaranteed when each of them is actually a 32-bit value. struct Pivot32 { static inline std::size_t Calc(uint64_t off, uint64_t range, uint64_t width) { return static_cast((off * width) / (range + 1)); } }; // Usage: PivotSelect::T template struct PivotSelect; template <> struct PivotSelect<8> { typedef Pivot64 T; }; template <> struct PivotSelect<4> { typedef Pivot32 T; }; template <> struct PivotSelect<2> { typedef Pivot32 T; }; /* Binary search. */ template bool BinaryFind( const Accessor &accessor, Iterator begin, Iterator end, const typename Accessor::Key key, Iterator &out) { while (end > begin) { Iterator pivot(begin + (end - begin) / 2); typename Accessor::Key mid(accessor(pivot)); if (mid < key) { begin = pivot + 1; } else if (mid > key) { end = pivot; } else { out = pivot; return true; } } return false; } // Search the range [before_it + 1, after_it - 1] for key. // Preconditions: // before_v <= key <= after_v // before_v <= all values in the range [before_it + 1, after_it - 1] <= after_v // range is sorted. template bool BoundedSortedUniformFind( const Accessor &accessor, Iterator before_it, typename Accessor::Key before_v, Iterator after_it, typename Accessor::Key after_v, const typename Accessor::Key key, Iterator &out) { while (after_it - before_it > 1) { Iterator pivot(before_it + (1 + Pivot::Calc(key - before_v, after_v - before_v, after_it - before_it - 1))); typename Accessor::Key mid(accessor(pivot)); if (mid < key) { before_it = pivot; before_v = mid; } else if (mid > key) { after_it = pivot; after_v = mid; } else { out = pivot; return true; } } return false; } template bool SortedUniformFind(const Accessor &accessor, Iterator begin, Iterator end, const typename Accessor::Key key, Iterator &out) { if (begin == end) return false; typename Accessor::Key below(accessor(begin)); if (key <= below) { if (key == below) { out = begin; return true; } return false; } // Make the range [begin, end]. 
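// (Switching to inclusive bounds lets the last element's key serve as the
// upper anchor for the interpolation pivot in BoundedSortedUniformFind.)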
--end; typename Accessor::Key above(accessor(end)); if (key >= above) { if (key == above) { out = end; return true; } return false; } return BoundedSortedUniformFind(accessor, begin, below, end, above, key, out); } // May return begin - 1. template Iterator BinaryBelow( const Accessor &accessor, Iterator begin, Iterator end, const typename Accessor::Key key) { while (end > begin) { Iterator pivot(begin + (end - begin) / 2); typename Accessor::Key mid(accessor(pivot)); if (mid < key) { begin = pivot + 1; } else if (mid > key) { end = pivot; } else { for (++pivot; (pivot < end) && accessor(pivot) == mid; ++pivot) {} return pivot - 1; } } return begin - 1; } } // namespace util #endif // UTIL_SORTED_UNIFORM__ ================================================ FILE: src/kenlm/util/sorted_uniform_test.cc ================================================ #include "util/sorted_uniform.hh" #include #include #include #include #include #define BOOST_TEST_MODULE SortedUniformTest #include #include #include #include namespace util { namespace { template struct Entry { typedef KeyT Key; typedef ValueT Value; Key key; Value value; Key GetKey() const { return key; } Value GetValue() const { return value; } bool operator<(const Entry &other) const { return key < other.key; } }; template struct Accessor { typedef KeyT Key; template Key operator()(const Entry *entry) const { return entry->GetKey(); } }; template void Check(const Entry *begin, const Entry *end, const boost::unordered_map &reference, const Key key) { typename boost::unordered_map::const_iterator ref = reference.find(key); typedef const Entry *It; // g++ can't tell that require will crash and burn. It i = NULL; bool ret = SortedUniformFind, Pivot64>(Accessor(), begin, end, key, i); if (ref == reference.end()) { BOOST_CHECK(!ret); } else { BOOST_REQUIRE(ret); BOOST_CHECK_EQUAL(ref->second, i->GetValue()); } } BOOST_AUTO_TEST_CASE(empty) { typedef const Entry T; const T *i; bool ret = SortedUniformFind, Pivot64>(Accessor(), (const T*)NULL, (const T*)NULL, (uint64_t)10, i); BOOST_CHECK(!ret); } template void RandomTest(Key upper, size_t entries, size_t queries) { typedef unsigned char Value; boost::mt19937 rng; boost::uniform_int range_key(0, upper); boost::uniform_int range_value(0, 255); boost::variate_generator > gen_key(rng, range_key); boost::variate_generator > gen_value(rng, range_value); typedef Entry Ent; std::vector backing; boost::unordered_map reference; Ent ent; for (size_t i = 0; i < entries; ++i) { Key key = gen_key(); unsigned char value = gen_value(); if (reference.insert(std::make_pair(key, value)).second) { ent.key = key; ent.value = value; backing.push_back(ent); } } std::sort(backing.begin(), backing.end()); // Random queries. 
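// (Each random key is looked up with SortedUniformFind and checked against the
// unordered_map reference built above, so both hits and misses are exercised.)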
for (size_t i = 0; i < queries; ++i) { const Key key = gen_key(); Check(&*backing.begin(), &*backing.end(), reference, key); } typename boost::unordered_map::const_iterator it = reference.begin(); for (size_t i = 0; (i < queries) && (it != reference.end()); ++i, ++it) { Check(&*backing.begin(), &*backing.end(), reference, it->second); } } BOOST_AUTO_TEST_CASE(basic) { RandomTest(11, 10, 200); } BOOST_AUTO_TEST_CASE(tiny_dense_random) { RandomTest(11, 50, 200); } BOOST_AUTO_TEST_CASE(small_dense_random) { RandomTest(100, 100, 200); } BOOST_AUTO_TEST_CASE(small_sparse_random) { RandomTest(200, 15, 200); } BOOST_AUTO_TEST_CASE(medium_sparse_random) { RandomTest(32000, 1000, 2000); } BOOST_AUTO_TEST_CASE(sparse_random) { RandomTest(std::numeric_limits::max(), 100000, 2000); } } // namespace } // namespace util ================================================ FILE: src/kenlm/util/string_piece.cc ================================================ // Copyright 2004 The RE2 Authors. All Rights Reserved. // Use of this source code is governed by a BSD-style // license that can be found in string_piece.hh. #include "util/string_piece.hh" #include #include #ifndef HAVE_ICU typedef StringPiece::size_type size_type; void StringPiece::CopyToString(std::string* target) const { target->assign(ptr_, length_); } size_type StringPiece::find(const StringPiece& s, size_type pos) const { // Not sure why length_ < 0 was here since it's std::size_t. if (/*length_ < 0 || */pos > static_cast(length_)) return npos; const char* result = std::search(ptr_ + pos, ptr_ + length_, s.ptr_, s.ptr_ + s.length_); const size_type xpos = result - ptr_; return xpos + s.length_ <= length_ ? xpos : npos; } size_type StringPiece::find(char c, size_type pos) const { if (length_ <= 0 || pos >= static_cast(length_)) { return npos; } const char* result = std::find(ptr_ + pos, ptr_ + length_, c); return result != ptr_ + length_ ? result - ptr_ : npos; } size_type StringPiece::rfind(const StringPiece& s, size_type pos) const { if (length_ < s.length_) return npos; const size_t ulen = length_; if (s.length_ == 0) return std::min(ulen, pos); const char* last = ptr_ + std::min(ulen - s.length_, pos) + s.length_; const char* result = std::find_end(ptr_, last, s.ptr_, s.ptr_ + s.length_); return result != last ? result - ptr_ : npos; } size_type StringPiece::rfind(char c, size_type pos) const { if (length_ <= 0) return npos; for (int i = std::min(pos, static_cast(length_ - 1)); i >= 0; --i) { if (ptr_[i] == c) { return i; } } return npos; } // For each character in characters_wanted, sets the index corresponding // to the ASCII code of that character to 1 in table. This is used by // the find_.*_of methods below to tell whether or not a character is in // the lookup table in constant time. // The argument `table' must be an array that is large enough to hold all // the possible values of an unsigned char. Thus it should be be declared // as follows: // bool table[UCHAR_MAX + 1] static inline void BuildLookupTable(const StringPiece& characters_wanted, bool* table) { const size_type length = characters_wanted.length(); const char* const data = characters_wanted.data(); for (size_type i = 0; i < length; ++i) { table[static_cast(data[i])] = true; } } size_type StringPiece::find_first_of(const StringPiece& s, size_type pos) const { if (length_ == 0 || s.length_ == 0) return npos; // Avoid the cost of BuildLookupTable() for a single-character search. 
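// (For a one-character set, the overload below simply forwards to find(),
// avoiding the bool[UCHAR_MAX + 1] table that BuildLookupTable would fill.)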
if (s.length_ == 1) return find_first_of(s.ptr_[0], pos); bool lookup[UCHAR_MAX + 1] = { false }; BuildLookupTable(s, lookup); for (size_type i = pos; i < length_; ++i) { if (lookup[static_cast(ptr_[i])]) { return i; } } return npos; } size_type StringPiece::find_first_not_of(const StringPiece& s, size_type pos) const { if (length_ == 0) return npos; if (s.length_ == 0) return 0; // Avoid the cost of BuildLookupTable() for a single-character search. if (s.length_ == 1) return find_first_not_of(s.ptr_[0], pos); bool lookup[UCHAR_MAX + 1] = { false }; BuildLookupTable(s, lookup); for (size_type i = pos; i < length_; ++i) { if (!lookup[static_cast(ptr_[i])]) { return i; } } return npos; } size_type StringPiece::find_first_not_of(char c, size_type pos) const { if (length_ == 0) return npos; for (; pos < length_; ++pos) { if (ptr_[pos] != c) { return pos; } } return npos; } size_type StringPiece::find_last_of(const StringPiece& s, size_type pos) const { if (length_ == 0 || s.length_ == 0) return npos; // Avoid the cost of BuildLookupTable() for a single-character search. if (s.length_ == 1) return find_last_of(s.ptr_[0], pos); bool lookup[UCHAR_MAX + 1] = { false }; BuildLookupTable(s, lookup); for (size_type i = std::min(pos, length_ - 1); ; --i) { if (lookup[static_cast(ptr_[i])]) return i; if (i == 0) break; } return npos; } size_type StringPiece::find_last_not_of(const StringPiece& s, size_type pos) const { if (length_ == 0) return npos; size_type i = std::min(pos, length_ - 1); if (s.length_ == 0) return i; // Avoid the cost of BuildLookupTable() for a single-character search. if (s.length_ == 1) return find_last_not_of(s.ptr_[0], pos); bool lookup[UCHAR_MAX + 1] = { false }; BuildLookupTable(s, lookup); for (; ; --i) { if (!lookup[static_cast(ptr_[i])]) return i; if (i == 0) break; } return npos; } size_type StringPiece::find_last_not_of(char c, size_type pos) const { if (length_ == 0) return npos; for (size_type i = std::min(pos, length_ - 1); ; --i) { if (ptr_[i] != c) return i; if (i == 0) break; } return npos; } StringPiece StringPiece::substr(size_type pos, size_type n) const { if (pos > length_) pos = length_; if (n > length_ - pos) n = length_ - pos; return StringPiece(ptr_ + pos, n); } const size_type StringPiece::npos = size_type(-1); #endif // !HAVE_ICU ================================================ FILE: src/kenlm/util/string_piece.hh ================================================ /* If you use ICU in your program, then compile with -DHAVE_ICU -licui18n. If * you don't use ICU, then this will use the Google implementation from Chrome. * This has been modified from the original version to let you choose. */ // Copyright 2008, Google Inc. // All rights reserved. // // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following disclaimer // in the documentation and/or other materials provided with the // distribution. // * Neither the name of Google Inc. nor the names of its // contributors may be used to endorse or promote products derived from // this software without specific prior written permission. 
// // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. // Copied from strings/stringpiece.h with modifications // // A string-like object that points to a sized piece of memory. // // Functions or methods may use const StringPiece& parameters to accept either // a "const char*" or a "string" value that will be implicitly converted to // a StringPiece. The implicit conversion means that it is often appropriate // to include this .h file in other files rather than forward-declaring // StringPiece as would be appropriate for most other Google classes. // // Systematic usage of StringPiece is encouraged as it will reduce unnecessary // conversions from "const char*" to "string" and back again. // #ifndef BASE_STRING_PIECE_H__ #define BASE_STRING_PIECE_H__ #include "util/have.hh" #include #include #include #ifdef HAVE_ICU #include #include // Old versions of ICU don't define operator== and operator!=. #if (U_ICU_VERSION_MAJOR_NUM < 4) || ((U_ICU_VERSION_MAJOR_NUM == 4) && (U_ICU_VERSION_MINOR_NUM < 4)) #warning You are using an old version of ICU. Consider upgrading to ICU >= 4.6. inline bool operator==(const StringPiece& x, const StringPiece& y) { if (x.size() != y.size()) return false; return std::memcmp(x.data(), y.data(), x.size()) == 0; } inline bool operator!=(const StringPiece& x, const StringPiece& y) { return !(x == y); } #endif // old version of ICU U_NAMESPACE_BEGIN #else #include #include #include #include #ifdef WIN32 #undef max #undef min #endif class StringPiece { public: typedef size_t size_type; private: const char* ptr_; size_type length_; public: // We provide non-explicit singleton constructors so users can pass // in a "const char*" or a "string" wherever a "StringPiece" is // expected. StringPiece() : ptr_(NULL), length_(0) { } StringPiece(const char* str) : ptr_(str), length_((str == NULL) ? 0 : strlen(str)) { } StringPiece(const std::string& str) : ptr_(str.data()), length_(str.size()) { } StringPiece(const char* offset, size_type len) : ptr_(offset), length_(len) { } // data() may return a pointer to a buffer with embedded NULs, and the // returned buffer may or may not be null terminated. Therefore it is // typically a mistake to pass data() to a routine that expects a NUL // terminated string. const char* data() const { return ptr_; } size_type size() const { return length_; } size_type length() const { return length_; } bool empty() const { return length_ == 0; } void clear() { ptr_ = NULL; length_ = 0; } void set(const char* data, size_type len) { ptr_ = data; length_ = len; } void set(const char* str) { ptr_ = str; length_ = str ? 
strlen(str) : 0; } void set(const void* data, size_type len) { ptr_ = reinterpret_cast(data); length_ = len; } char operator[](size_type i) const { return ptr_[i]; } void remove_prefix(size_type n) { ptr_ += n; length_ -= n; } void remove_suffix(size_type n) { length_ -= n; } int compare(const StringPiece& x) const { int r = wordmemcmp(ptr_, x.ptr_, std::min(length_, x.length_)); if (r == 0) { if (length_ < x.length_) r = -1; else if (length_ > x.length_) r = +1; } return r; } std::string as_string() const { // std::string doesn't like to take a NULL pointer even with a 0 size. return std::string(!empty() ? data() : "", size()); } void CopyToString(std::string* target) const; void AppendToString(std::string* target) const; // Does "this" start with "x" bool starts_with(const StringPiece& x) const { return ((length_ >= x.length_) && (wordmemcmp(ptr_, x.ptr_, x.length_) == 0)); } // Does "this" end with "x" bool ends_with(const StringPiece& x) const { return ((length_ >= x.length_) && (wordmemcmp(ptr_ + (length_-x.length_), x.ptr_, x.length_) == 0)); } // standard STL container boilerplate typedef char value_type; typedef const char* pointer; typedef const char& reference; typedef const char& const_reference; typedef ptrdiff_t difference_type; static const size_type npos; typedef const char* const_iterator; typedef const char* iterator; typedef std::reverse_iterator const_reverse_iterator; typedef std::reverse_iterator reverse_iterator; iterator begin() const { return ptr_; } iterator end() const { return ptr_ + length_; } const_reverse_iterator rbegin() const { return const_reverse_iterator(ptr_ + length_); } const_reverse_iterator rend() const { return const_reverse_iterator(ptr_); } size_type max_size() const { return length_; } size_type capacity() const { return length_; } size_type copy(char* buf, size_type n, size_type pos = 0) const; size_type find(const StringPiece& s, size_type pos = 0) const; size_type find(char c, size_type pos = 0) const; size_type rfind(const StringPiece& s, size_type pos = npos) const; size_type rfind(char c, size_type pos = npos) const; size_type find_first_of(const StringPiece& s, size_type pos = 0) const; size_type find_first_of(char c, size_type pos = 0) const { return find(c, pos); } size_type find_first_not_of(const StringPiece& s, size_type pos = 0) const; size_type find_first_not_of(char c, size_type pos = 0) const; size_type find_last_of(const StringPiece& s, size_type pos = npos) const; size_type find_last_of(char c, size_type pos = npos) const { return rfind(c, pos); } size_type find_last_not_of(const StringPiece& s, size_type pos = npos) const; size_type find_last_not_of(char c, size_type pos = npos) const; StringPiece substr(size_type pos, size_type n = npos) const; static int wordmemcmp(const char* p, const char* p2, size_type N) { return memcmp(p, p2, N); } }; inline bool operator==(const StringPiece& x, const StringPiece& y) { if (x.size() != y.size()) return false; return std::memcmp(x.data(), y.data(), x.size()) == 0; } inline bool operator!=(const StringPiece& x, const StringPiece& y) { return !(x == y); } #endif // HAVE_ICU undefined inline bool operator<(const StringPiece& x, const StringPiece& y) { const int r = std::memcmp(x.data(), y.data(), std::min(x.size(), y.size())); return ((r < 0) || ((r == 0) && (x.size() < y.size()))); } inline bool operator>(const StringPiece& x, const StringPiece& y) { return y < x; } inline bool operator<=(const StringPiece& x, const StringPiece& y) { return !(x > y); } inline bool operator>=(const 
StringPiece& x, const StringPiece& y) { return !(x < y); } // allow StringPiece to be logged (needed for unit testing). inline std::ostream& operator<<(std::ostream& o, const StringPiece& piece) { return o.write(piece.data(), static_cast(piece.size())); } #ifdef HAVE_ICU U_NAMESPACE_END using U_NAMESPACE_QUALIFIER StringPiece; #endif #endif // BASE_STRING_PIECE_H__ ================================================ FILE: src/kenlm/util/string_piece_hash.hh ================================================ #ifndef UTIL_STRING_PIECE_HASH__ #define UTIL_STRING_PIECE_HASH__ #include "util/string_piece.hh" #include #include inline size_t hash_value(const StringPiece &str) { return boost::hash_range(str.data(), str.data() + str.length()); } /* Support for lookup of StringPiece in boost::unordered_map */ struct StringPieceCompatibleHash : public std::unary_function { size_t operator()(const StringPiece &str) const { return hash_value(str); } }; struct StringPieceCompatibleEquals : public std::binary_function { bool operator()(const StringPiece &first, const StringPiece &second) const { return first == second; } }; template typename T::const_iterator FindStringPiece(const T &t, const StringPiece &key) { #if BOOST_VERSION < 104200 std::string temp(key.data(), key.size()); return t.find(temp); #else return t.find(key, StringPieceCompatibleHash(), StringPieceCompatibleEquals()); #endif } template typename T::iterator FindStringPiece(T &t, const StringPiece &key) { #if BOOST_VERSION < 104200 std::string temp(key.data(), key.size()); return t.find(temp); #else return t.find(key, StringPieceCompatibleHash(), StringPieceCompatibleEquals()); #endif } #endif // UTIL_STRING_PIECE_HASH__ ================================================ FILE: src/kenlm/util/thread_pool.hh ================================================ #ifndef UTIL_THREAD_POOL__ #define UTIL_THREAD_POOL__ #include "util/pcqueue.hh" #include #include #include #include #include namespace util { template class Worker : boost::noncopyable { public: typedef HandlerT Handler; typedef typename Handler::Request Request; template Worker(PCQueue &in, Construct &construct, Request &poison) : in_(in), handler_(construct), thread_(boost::ref(*this)), poison_(poison) {} // Only call from thread. void operator()() { Request request; while (1) { in_.Consume(request); if (request == poison_) return; try { (*handler_)(request); } catch(std::exception &e) { std::cerr << "Handler threw " << e.what() << std::endl; abort(); } catch(...) { std::cerr << "Handler threw an exception, dropping request" << std::endl; abort(); } } } void Join() { thread_.join(); } private: PCQueue &in_; boost::optional handler_; boost::thread thread_; Request poison_; }; template class ThreadPool : boost::noncopyable { public: typedef HandlerT Handler; typedef typename Handler::Request Request; template ThreadPool(size_t queue_length, size_t workers, Construct handler_construct, Request poison) : in_(queue_length), poison_(poison) { for (size_t i = 0; i < workers; ++i) { workers_.push_back(new Worker(in_, handler_construct, poison)); } } ~ThreadPool() { for (size_t i = 0; i < workers_.size(); ++i) { Produce(poison_); } for (typename boost::ptr_vector >::iterator i = workers_.begin(); i != workers_.end(); ++i) { i->Join(); } } void Produce(const Request &request) { in_.Produce(request); } // For adding to the queue. 
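// (Produce() above and In().Produce() are equivalent; on destruction the pool
// enqueues one poison request per worker and then joins each worker thread.)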
PCQueue &In() { return in_; } private: PCQueue in_; boost::ptr_vector > workers_; Request poison_; }; } // namespace util #endif // UTIL_THREAD_POOL__ ================================================ FILE: src/kenlm/util/tokenize_piece.hh ================================================ #ifndef UTIL_TOKENIZE_PIECE__ #define UTIL_TOKENIZE_PIECE__ #include "util/exception.hh" #include "util/string_piece.hh" #include #include #include namespace util { // Thrown on dereference when out of tokens to parse class OutOfTokens : public Exception { public: OutOfTokens() throw() {} ~OutOfTokens() throw() {} }; class SingleCharacter { public: SingleCharacter() {} explicit SingleCharacter(char delim) : delim_(delim) {} StringPiece Find(const StringPiece &in) const { return StringPiece(std::find(in.data(), in.data() + in.size(), delim_), 1); } private: char delim_; }; class MultiCharacter { public: MultiCharacter() {} explicit MultiCharacter(const StringPiece &delimiter) : delimiter_(delimiter) {} StringPiece Find(const StringPiece &in) const { return StringPiece(std::search(in.data(), in.data() + in.size(), delimiter_.data(), delimiter_.data() + delimiter_.size()), delimiter_.size()); } private: StringPiece delimiter_; }; class AnyCharacter { public: AnyCharacter() {} explicit AnyCharacter(const StringPiece &chars) : chars_(chars) {} StringPiece Find(const StringPiece &in) const { return StringPiece(std::find_first_of(in.data(), in.data() + in.size(), chars_.data(), chars_.data() + chars_.size()), 1); } private: StringPiece chars_; }; class AnyCharacterLast { public: AnyCharacterLast() {} explicit AnyCharacterLast(const StringPiece &chars) : chars_(chars) {} StringPiece Find(const StringPiece &in) const { return StringPiece(std::find_end(in.data(), in.data() + in.size(), chars_.data(), chars_.data() + chars_.size()), 1); } private: StringPiece chars_; }; template class TokenIter : public boost::iterator_facade, const StringPiece, boost::forward_traversal_tag> { public: TokenIter() {} template TokenIter(const StringPiece &str, const Construct &construct) : after_(str), finder_(construct) { increment(); } bool operator!() const { return current_.data() == 0; } operator bool() const { return current_.data() != 0; } static TokenIter end() { return TokenIter(); } private: friend class boost::iterator_core_access; void increment() { do { StringPiece found(finder_.Find(after_)); current_ = StringPiece(after_.data(), found.data() - after_.data()); if (found.data() == after_.data() + after_.size()) { after_ = StringPiece(NULL, 0); } else { after_ = StringPiece(found.data() + found.size(), after_.data() - found.data() + after_.size() - found.size()); } } while (SkipEmpty && current_.data() && current_.empty()); // Compiler should optimize this away if SkipEmpty is false. 
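// (With SkipEmpty set, runs of adjacent delimiters yield no empty tokens, as
// the remove_empty test case below illustrates.)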
} bool equal(const TokenIter &other) const { return current_.data() == other.current_.data(); } const StringPiece &dereference() const { UTIL_THROW_IF(!current_.data(), OutOfTokens, "Ran out of tokens"); return current_; } StringPiece current_; StringPiece after_; Find finder_; }; } // namespace util #endif // UTIL_TOKENIZE_PIECE__ ================================================ FILE: src/kenlm/util/tokenize_piece_test.cc ================================================ #include "util/tokenize_piece.hh" #include "util/string_piece.hh" #define BOOST_TEST_MODULE TokenIteratorTest #include #include namespace util { namespace { BOOST_AUTO_TEST_CASE(pipe_pipe_none) { const char str[] = "nodelimit at all"; TokenIter it(str, MultiCharacter("|||")); BOOST_REQUIRE(it); BOOST_CHECK_EQUAL(StringPiece(str), *it); ++it; BOOST_CHECK(!it); } BOOST_AUTO_TEST_CASE(pipe_pipe_two) { const char str[] = "|||"; TokenIter it(str, MultiCharacter("|||")); BOOST_REQUIRE(it); BOOST_CHECK_EQUAL(StringPiece(), *it); ++it; BOOST_REQUIRE(it); BOOST_CHECK_EQUAL(StringPiece(), *it); ++it; BOOST_CHECK(!it); } BOOST_AUTO_TEST_CASE(remove_empty) { const char str[] = "|||"; TokenIter it(str, MultiCharacter("|||")); BOOST_CHECK(!it); } BOOST_AUTO_TEST_CASE(remove_empty_keep) { const char str[] = " |||"; TokenIter it(str, MultiCharacter("|||")); BOOST_REQUIRE(it); BOOST_CHECK_EQUAL(StringPiece(" "), *it); ++it; BOOST_CHECK(!it); } } // namespace } // namespace util ================================================ FILE: src/kenlm/util/usage.cc ================================================ #include "util/usage.hh" #include "util/exception.hh" #include #include #include #include #include #if !defined(_WIN32) && !defined(_WIN64) #include #include #include #endif namespace util { namespace { #if !defined(_WIN32) && !defined(_WIN64) float FloatSec(const struct timeval &tv) { return static_cast(tv.tv_sec) + (static_cast(tv.tv_usec) / 1000000.0); } #endif } // namespace void PrintUsage(std::ostream &out) { #if !defined(_WIN32) && !defined(_WIN64) struct rusage usage; if (getrusage(RUSAGE_SELF, &usage)) { perror("getrusage"); return; } out << "user\t" << FloatSec(usage.ru_utime) << "\nsys\t" << FloatSec(usage.ru_stime) << '\n'; // Linux doesn't set memory usage :-(. 
std::ifstream status("/proc/self/status", std::ios::in); std::string line; while (getline(status, line)) { if (!strncmp(line.c_str(), "VmRSS:\t", 7)) { out << "VmRSS: " << (line.c_str() + 7) << '\n'; break; } else if (!strncmp(line.c_str(), "VmPeak:\t", 8)) { out << "VmPeak: " << (line.c_str() + 8) << '\n'; } } #endif } uint64_t GuessPhysicalMemory() { #if defined(_WIN32) || defined(_WIN64) return 0; #elif defined(_SC_PHYS_PAGES) && defined(_SC_PAGESIZE) long pages = sysconf(_SC_PHYS_PAGES); if (pages == -1) return 0; long page_size = sysconf(_SC_PAGESIZE); if (page_size == -1) return 0; return static_cast(pages) * static_cast(page_size); #else return 0; #endif } namespace { class SizeParseError : public Exception { public: explicit SizeParseError(const std::string &str) throw() { *this << "Failed to parse " << str << " into a memory size "; } }; template uint64_t ParseNum(const std::string &arg) { std::stringstream stream(arg); Num value; stream >> value; UTIL_THROW_IF_ARG(!stream, SizeParseError, (arg), "for the leading number."); std::string after; stream >> after; UTIL_THROW_IF_ARG(after.size() > 1, SizeParseError, (arg), "because there are more than two characters after the number."); std::string throwaway; UTIL_THROW_IF_ARG(stream >> throwaway, SizeParseError, (arg), "because there was more cruft " << throwaway << " after the number."); // Silly sort, using kilobytes as your default unit. if (after.empty()) after = "K"; if (after == "%") { uint64_t mem = GuessPhysicalMemory(); UTIL_THROW_IF_ARG(!mem, SizeParseError, (arg), "because % was specified but the physical memory size could not be determined."); return static_cast(value) * static_cast(mem) / 100.0; } std::string units("bKMGTPEZY"); std::string::size_type index = units.find(after[0]); UTIL_THROW_IF_ARG(index == std::string::npos, SizeParseError, (arg), "the allowed suffixes are " << units << "%."); for (std::string::size_type i = 0; i < index; ++i) { value *= 1024; } return value; } } // namespace uint64_t ParseSize(const std::string &arg) { return arg.find('.') == std::string::npos ? ParseNum(arg) : ParseNum(arg); } } // namespace util ================================================ FILE: src/kenlm/util/usage.hh ================================================ #ifndef UTIL_USAGE__ #define UTIL_USAGE__ #include #include #include #include namespace util { void PrintUsage(std::ostream &to); // Determine how much physical memory there is. Return 0 on failure. uint64_t GuessPhysicalMemory(); // Parse a size like unix sort. Sadly, this means the default multiplier is K. uint64_t ParseSize(const std::string &arg); } // namespace util #endif // UTIL_USAGE__ ================================================ FILE: src/opennlp/ccg/Parse.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2010 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. 
// // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg; import java.io.*; import java.net.URL; import java.util.HashMap; import java.util.Map; import org.jdom.Document; import org.jdom.Element; import org.jdom.output.Format; import org.jdom.output.XMLOutputter; import opennlp.ccg.grammar.Grammar; import opennlp.ccg.hylo.HyloHelper; import opennlp.ccg.hylo.Nominal; import opennlp.ccg.lexicon.Tokenizer; import opennlp.ccg.parse.ParseException; import opennlp.ccg.parse.Parser; import opennlp.ccg.parse.Supertagger; import opennlp.ccg.parse.supertagger.WordAndPOSDictionaryLabellingStrategy; import opennlp.ccg.synsem.Category; import opennlp.ccg.synsem.LF; import opennlp.ccg.synsem.Sign; import opennlp.ccg.synsem.SignScorer; import opennlp.ccg.test.RegressionInfo; import opennlp.ccg.test.DerivMaker; import opennlp.ccgbank.extract.Testbed; /** * Creates a testbed file by parsing a text file. * Text is assumed to be tokenized, with one sentence per line. * * @author Michael White * @version $Revision: 1.2 $, $Date: 2010/10/28 02:46:32 $ */ public class Parse { public static void main(String[] args) throws IOException { String usage = "Usage: java opennlp.ccg.Parse \n" + " (-g ) \n" + " -parsescorer \n" + " -supertagger | -stconfig \n" + " (-nbestListSize ) \n" + " (-includederivs) \n" + " (-includescores) \n" + " "; if (args.length == 0 || args[0].equals("-h")) { System.out.println(usage); System.exit(0); } // args String grammarfile = "grammar.xml"; String inputfile = null; String outputfile = null; String parseScorerClass = null; String supertaggerClass = null, stconfig = null; boolean includederivs = false; boolean includescores = false; int nbestListSize = 1; for (int i = 0; i < args.length; i++) { if (args[i].equals("-g")) { grammarfile = args[++i]; continue; } if (args[i].equals("-parsescorer")) { parseScorerClass = args[++i]; continue; } if (args[i].equals("-supertagger")) { supertaggerClass = args[++i]; continue; } if (args[i].equals("-stconfig")) { stconfig = args[++i]; continue; } if (args[i].equals("-nbestListSize")) { nbestListSize = Integer.parseInt(args[++i]); continue; } if (args[i].equals("-includederivs")) { includederivs = true; continue; } if (args[i].equals("-includescores")) { includescores = true; continue; } if (inputfile == null) { inputfile = args[i]; continue; } outputfile = args[i]; } if (nbestListSize < 1) nbestListSize = 1; if (inputfile == null || outputfile == null || parseScorerClass == null || (supertaggerClass == null && stconfig == null)) { System.out.println(usage); System.exit(0); } // make test doc, sign map Document outDoc = new Document(); Element outRoot = new Element("regression"); outDoc.setRootElement(outRoot); Map signMap = new HashMap(); // load grammar URL grammarURL = new File(grammarfile).toURI().toURL(); System.out.println("Loading grammar from URL: " + grammarURL); Grammar grammar = new Grammar(grammarURL); Tokenizer tokenizer = grammar.lexicon.tokenizer; System.out.println(); // set up parser Parser parser = new Parser(grammar); // instantiate scorer try { System.out.println("Instantiating parsing sign scorer from class: " + parseScorerClass); SignScorer parseScorer = (SignScorer) Class.forName(parseScorerClass).newInstance(); parser.setSignScorer(parseScorer); System.out.println(); } 
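/*
 * The -parsescorer argument names a class that is loaded reflectively, so it
 * needs a public no-arg constructor and must implement
 * opennlp.ccg.synsem.SignScorer (as the sample scorers under ccgbank/plugins
 * do).  A minimal sketch, assuming SignScorer declares a single
 * score(Sign, boolean) method; the bias toward signs covering fewer words is
 * purely illustrative, and the package and class name are hypothetical:
 *
 *   package myplugins;
 *   import opennlp.ccg.synsem.Sign;
 *   import opennlp.ccg.synsem.SignScorer;
 *
 *   public class ShortSpanScorer implements SignScorer {
 *       public double score(Sign sign, boolean complete) {
 *           // higher score for signs spanning fewer words
 *           return 1.0 / (1 + sign.getWords().size());
 *       }
 *   }
 *
 * which would then be supplied as: -parsescorer myplugins.ShortSpanScorer
 */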
catch (Exception exc) { throw (RuntimeException) new RuntimeException().initCause(exc); } // instantiate supertagger try { Supertagger supertagger; if (supertaggerClass != null) { System.out.println("Instantiating supertagger from class: " + supertaggerClass); supertagger = (Supertagger) Class.forName(supertaggerClass).newInstance(); } else { System.out.println("Instantiating supertagger from config file: " + stconfig); supertagger = WordAndPOSDictionaryLabellingStrategy.supertaggerFactory(stconfig); } parser.setSupertagger(supertagger); System.out.println(); } catch (Exception exc) { throw (RuntimeException) new RuntimeException().initCause(exc); } // loop through input BufferedReader in = new BufferedReader(new FileReader(inputfile)); String line; Map predInfoMap = new HashMap(); System.out.println("Parsing " + inputfile); System.out.println(); int count = 1; while ((line = in.readLine()) != null) { String id = "s" + count; try { // parse it System.out.println(line); parser.parse(line); int numParses = Math.min(nbestListSize, parser.getResult().size()); for (int i=0; i < numParses; i++) { Sign thisParse = parser.getResult().get(i); // convert lf Category cat = thisParse.getCategory(); LF convertedLF = null; String predInfo = null; if (cat.getLF() != null) { // convert LF LF flatLF = cat.getLF(); cat = cat.copy(); Nominal index = cat.getIndexNominal(); convertedLF = HyloHelper.compactAndConvertNominals(flatLF, index, thisParse); // get pred info predInfoMap.clear(); Testbed.extractPredInfo(flatLF, predInfoMap); predInfo = Testbed.getPredInfo(predInfoMap); } // add test item, sign Element item = RegressionInfo.makeTestItem(grammar, line, 1, convertedLF); String actualID = (nbestListSize == 1) ? id : id + "-" + (i+1); item.setAttribute("info", actualID); item.setAttribute("test","true"); outRoot.addContent(item); signMap.put(actualID, thisParse); // Add parsed words as a separate LF element Element fullWordsElt = new Element("full-words"); fullWordsElt.addContent(tokenizer.format(thisParse.getWords())); item.addContent(fullWordsElt); if (predInfo != null) { Element predInfoElt = new Element("pred-info"); predInfoElt.setAttribute("data", predInfo); item.addContent(predInfoElt); } if (includederivs) { Element derivElt = new Element("deriv"); derivElt.addContent(DerivMaker.makeDeriv(thisParse)); item.addContent(derivElt); } if (includescores) { String score = parser.getScores().get(i).toString(); item.setAttribute("score", score); } } } catch (ParseException e) { System.out.println("Unable to parse!"); // add test item with zero parses Element item = RegressionInfo.makeTestItem(grammar, line, 0, null); item.setAttribute("info", id); outRoot.addContent(item); } count++; } System.out.println(); // write test doc, saved signs System.out.println("Writing parses to " + outputfile); XMLOutputter outputter = new XMLOutputter(Format.getPrettyFormat()); File regressionFile = new File(outputfile); outputter.output(outDoc, new FileOutputStream(regressionFile)); RegressionInfo.writeSerFile(signMap, regressionFile); System.out.println(); // done in.close(); System.out.println("Done."); } } ================================================ FILE: src/opennlp/ccg/Realize.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-7 University of Edinburgh, Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as 
published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg; import opennlp.ccg.realize.*; import opennlp.ccg.realize.hypertagger.ZLMaxentHypertagger; import opennlp.ccg.grammar.*; import opennlp.ccg.synsem.*; import opennlp.ccg.ngrams.*; import org.jdom.*; import org.jdom.output.*; import java.io.*; import java.net.*; import java.util.*; import java.util.prefs.*; /** * Sample front-end to the realizer, showing the intermediate steps of realization. * * @author Michael White * @version $Revision: 1.38 $, $Date: 2011/08/10 17:58:45 $ */ public class Realize { private static PrintWriter out; @SuppressWarnings("unchecked") public static void main(String[] args) throws Exception { String usage = "Usage: java opennlp.ccg.Realize (-g ) (-exactmatches) (-ngramorder N) ()"; if (args.length > 0 && args[0].equals("-h")) { System.out.println(usage); System.exit(0); } // args String grammarfile = "grammar.xml"; String inputfile = null; String outputfile = null; boolean exactMatches = false; int ngramOrder = 0; for (int i = 0; i < args.length; i++) { if (args[i].startsWith("-D")) { String prop = args[i].substring(2); int equalpos = prop.indexOf("="); String key = prop.substring(0, equalpos); String val = prop.substring(equalpos+1); System.setProperty(key, val); continue; } if (args[i].equals("-g")) { grammarfile = args[++i]; continue; } if (args[i].equals("-exactmatches")) { exactMatches = true; continue; } if (args[i].equals("-ngramorder")) { ngramOrder = Integer.parseInt(args[++i]); continue; } if (inputfile == null) { inputfile = args[i]; continue; } outputfile = args[i]; } if (inputfile == null) { System.out.println(usage); System.exit(0); } // set out accordingly if (outputfile != null) { out = new PrintWriter(new BufferedWriter(new FileWriter(outputfile))); } else { out = new PrintWriter(System.out); } // remember, modify prefs Preferences prefs = Preferences.userNodeForPackage(TextCCG.class); boolean oldShowCompleteness = prefs.getBoolean(Edge.SHOW_COMPLETENESS, false); boolean oldShowBitset = prefs.getBoolean(Edge.SHOW_BITSET, false); prefs.putBoolean(Edge.SHOW_COMPLETENESS, true); prefs.putBoolean(Edge.SHOW_BITSET, true); // load grammar URL grammarURL = new File(grammarfile).toURI().toURL(); out.println("Loading grammar from URL: " + grammarURL); Grammar grammar = new Grammar(grammarURL); // instantiate realizer Realizer realizer = new Realizer(grammar); // get request out.println(); out.println("Request:"); out.println(); Document doc = grammar.loadFromXml(inputfile); org.jdom.output.XMLOutputter outputter = new org.jdom.output.XMLOutputter(Format.getPrettyFormat()); out.flush(); outputter.output(doc, out); out.flush(); LF lf = Realizer.getLfFromDoc(doc); out.println(); out.println("** Initial run"); out.println(); out.println("Input LF: " + lf); // set up n-gram scorer SignScorer ngramScorer; Element root = doc.getRootElement(); Element ngramModelElt = 
root.getChild("ngram-model"); if (ngramModelElt == null) { // just use targets List targetElts = root.getChildren("target"); String[] targets = new String[targetElts.size()]; out.println(); out.println("Targets:"); for (int i=0; i < targetElts.size(); i++) { Element ex = (Element) targetElts.get(i); String target = ex.getText(); out.println(target); targets[i] = target; } if (ngramOrder > 0) { out.println(); out.println("Using order " + ngramOrder + " in n-gram precision."); ngramScorer = new NgramPrecisionModel(targets, ngramOrder); } else ngramScorer = new NgramPrecisionModel(targets); if (exactMatches) { out.println(); out.println("Only counting exact matches in n-gram precision."); ((NgramPrecisionModel)ngramScorer).setExactMatches(exactMatches); } } else if (ngramModelElt.getAttributeValue("class") != null) { // load scorer from class String scorerClass = ngramModelElt.getAttributeValue("class"); out.println(); out.println("Instantiating scorer from class: " + scorerClass); ngramScorer = (SignScorer) Class.forName(scorerClass).newInstance(); } else { // load n-gram model String filename = ngramModelElt.getAttributeValue("file"); String reverseStr = ngramModelElt.getAttributeValue("reverse"); boolean reverse = (reverseStr != null) ? reverseStr.equals("true") : false; String factoredStr = ngramModelElt.getAttributeValue("factored"); boolean factored = (factoredStr != null) ? factoredStr.equals("true") : false; String semClassesStr = ngramModelElt.getAttributeValue("sem-classes"); boolean useSemClasses = (semClassesStr != null) ? semClassesStr.equals("true") : true; int order = 3; // order can only be changed for standard n-gram models String orderStr = ngramModelElt.getAttributeValue("order"); if (orderStr != null) { order = Integer.parseInt(orderStr); } if (ngramOrder > 0) order = ngramOrder; // preference given to command-line value out.println(); String msg = "Loading "; if (reverse) msg += "reversed "; if (factored) msg += "factored "; msg += "n-gram model "; if (!factored) msg += "of order " + order + " "; if (useSemClasses) msg += "with semantic class replacement "; msg += "from: " + filename; out.println(msg); if (factored) ngramScorer = new FactoredNgramModelFamily(filename, useSemClasses); else ngramScorer = new StandardNgramModel(order, filename, useSemClasses); if (reverse) ((NgramScorer)ngramScorer).setReverse(true); } // set pruning strategy (if any) Element pruningStrategyElt = root.getChild("pruning-strategy"); if (pruningStrategyElt != null) { // load pruning strategy from class String pruningStrategyClass = pruningStrategyElt.getAttributeValue("class"); out.println(); out.println("Instantiating pruning strategy from class: " + pruningStrategyClass); realizer.pruningStrategy = (PruningStrategy) Class.forName(pruningStrategyClass).newInstance(); } // set hypertagger (if any) Element htModelElt = root.getChild("ht-model"); if (htModelElt != null) { String htconfig = htModelElt.getAttributeValue("config"); if (htconfig != null) { out.println(); out.println("Instantiating hypertagger from: " + htconfig); realizer.hypertagger = ZLMaxentHypertagger.ZLMaxentHypertaggerFactory(htconfig); } else { String htModelClass = htModelElt.getAttributeValue("class"); out.println(); out.println("Instantiating hypertagger from class: " + htModelClass); realizer.hypertagger = (Hypertagger) Class.forName(htModelClass).newInstance(); } } // run request realizer.realize(lf, ngramScorer); Chart chart = realizer.getChart(); chart.out = out; out.println(); out.println("Preds:"); chart.printEPs(); 
out.println(); out.println("LF chunks:"); chart.printLfChunks(); out.println(); out.println("LF alts:"); chart.printLfAlts(); out.println(); out.println("LF optional parts:"); chart.printLfOpts(); out.println(); out.println("Initial Edges:"); chart.printInitialEdges(); out.println(); out.println("Marked Edges:"); chart.printMarkedEdges(); out.println(); out.println("Instantiated Semantically Null Edges:"); chart.printInstantiatedNoSemEdges(); out.println(); out.println("Uninstantiated Semantically Null Edges:"); chart.printNoSemEdges(); out.println(); out.println("Rule Instances:"); chart.printRuleInstances(); out.println(); out.println("All Edges:"); chart.printEdges(); out.println(); out.println("Complete Edges (unsorted):"); chart.printEdges(true); out.println(); out.println("Complete Edges (sorted):"); chart.printEdges(true, true); out.println(); out.println("Best Edge:"); chart.printBestEdge(); out.println(); out.println("Best Edge Derivation:"); out.println(chart.bestEdge.getSign().getDerivationHistory()); out.flush(); if (chart.bestJoinedEdge != null) { out.println(); out.println("Best Joined Edge:"); chart.printBestJoinedEdge(); out.println(); out.println("Best Joined Edge Derivation:"); out.println(chart.bestJoinedEdge.getSign().getDerivationHistory()); out.flush(); } // reset prefs prefs.putBoolean(Edge.SHOW_COMPLETENESS, oldShowCompleteness); prefs.putBoolean(Edge.SHOW_BITSET, oldShowBitset); } } ================================================ FILE: src/opennlp/ccg/TextCCG.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-4 Jason Baldridge, Gann Bierner, // University of Edinburgh (Michael White), // Alexandros Triantafyllidis and David Reitter // Copyright (C) 2006 Ben Wing // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg; import opennlp.ccg.lexicon.*; import opennlp.ccg.grammar.*; import opennlp.ccg.parse.*; import opennlp.ccg.util.*; import opennlp.ccg.synsem.*; import opennlp.ccg.realize.*; import opennlp.ccg.hylo.*; import opennlp.ccg.ngrams.*; import opennlp.ccg.test.*; import opennlp.ccg.realize.Edge; // only realization edges referenced (for preferences) import org.jdom.*; import java.io.*; import java.net.*; import java.util.*; import java.util.prefs.*; /** * A text interface for testing grammars. * * @author Jason Baldridge * @author Gann Bierner * @author Michael White * @author Alexandros Triantafyllidis * @author David Reitter * @version $Revision: 1.67 $, $Date: 2011/12/13 04:00:54 $ */ public class TextCCG { /** Preference key for showing all results. */ public static final String SHOW_ALL_RESULTS = "Show All Results"; /** Preference key for showing derivations. 
*/ public static final String SHOW_DERIVATIONS = "Show Derivations"; /** Preference key for showing features. */ public static final String SHOW_FEATURES = "Show Features"; /** Preference key for showing semantics. */ public static final String SHOW_SEMANTICS = "Show Semantics"; /** Preference key for showing features. */ public static final String FEATURES_TO_SHOW = "Features to Show"; /** Preference key for showing realizer timing. */ public static final String SHOW_TIMING = "Show Timing"; /** Preference key for showing incomplete edges during realization. */ public static final String SHOW_INCOMPLETE_EDGES = "Show Incomplete Edges"; /** Preference key for visualizing a derivation. */ public static final String VISUALIZE = "Visualize"; /** Preference key for command line history. */ public static final String HISTORY = "Command Line History"; /** Main method for tccg. */ @SuppressWarnings("unchecked") public static void main(String[] args) throws IOException, LexException { String usage = "java opennlp.ccg.TextCCG " + "() | (-exportprefs ) | (-importprefs )"; if (args.length > 0 && args[0].equals("-h")) { System.out.println("Usage: " + usage); System.exit(0); } // args String grammarfile = "grammar.xml"; String prefsfile = null; boolean exportPrefs = false; boolean importPrefs = false; for (int i = 0; i < args.length; i++) { if (args[i].equals("-exportprefs")) { exportPrefs = true; prefsfile = args[++i]; continue; } if (args[i].equals("-importprefs")) { importPrefs = true; prefsfile = args[++i]; continue; } grammarfile = args[i]; } // prefs Preferences prefs = Preferences.userNodeForPackage(TextCCG.class); try { if (exportPrefs) { System.out.println("Exporting preferences to prefsfile: " + prefsfile); prefs.exportNode(new FileOutputStream(prefsfile)); return; } if (importPrefs) { System.out.println("Importing preferences from prefsfile: " + prefsfile); Preferences.importPreferences(new FileInputStream(prefsfile)); return; } } catch (Exception exc) { throw (IOException) new IOException().initCause(exc); } // load grammar URL grammarURL = new File(grammarfile).toURI().toURL(); System.out.println("Loading grammar from URL: " + grammarURL); Grammar grammar = new Grammar(grammarURL); if (grammar.getName() != null) System.out.println("Grammar '" + grammar.getName() + "' loaded."); System.out.println(); // create parser and realizer Parser parser = new Parser(grammar); Realizer realizer = new Realizer(grammar); // stuff to remember during loop Sign[] lastResults = null; LF[] lastLFs = null; String lastSentence = ""; int lastReading = 0; // prepare to accept input from user String[] completions = { ":sh", ":v", ":reset", ":feats", ":nofeats", ":foff", ":sem", ":nosem", ":all", ":notall", ":derivs", ":noderivs", ":doff", ":vison", ":visoff", ":wordpos", ":nowordpos", ":eisner", ":noeisner", ":ptl", ":noptl", ":pel", ":nopel", ":ppv", ":noppv", ":pcpv", ":nopcpv", ":plazy", ":noplazy", ":r", ":sel", ":2xml", ":2tb", ":2apml", ":tl", ":notl", ":el", ":noel", ":nbtl", ":nonbtl", ":pv", ":nopv", ":cpv", ":nocpv", ":upon", ":upoff", ":t", ":toff", ":inc", ":noinc", ":ion", ":ioff", ":mion", ":mioff", ":con", ":coff", ":flon", ":floff", ":ccon", ":ccoff", ":pon", ":poff", ":q", ":h"}; LineReader lineReader = LineReader.createLineReader(completions); // initialize history, per grammar, from prefs String historyKey = HISTORY + "_" + grammar.getName(); String histStr = prefs.get(historyKey, ""); lineReader.setCommandHistory(histStr); // welcome msg System.out.println("Enter strings to parse."); 
System.out.println("Type ':r' to realize selected reading of previous parse."); System.out.println("Type ':h' for help on display options and ':q' to quit."); System.out.println("You can use the tab key for command completion, "); System.out.println("Ctrl-P (prev) and Ctrl-N (next) to access the command history, "); System.out.println("and emacs-style control keys to edit the line."); System.out.println(); while (true) { String input = lineReader.readLine("tccg> "); if (input == null) break; // control-D or the like input = input.trim(); if (input.equals(":show settings") || input.equals(":sh")) { showSettings(prefs); } else if (input.equals(":v")) { prefs.putBoolean(SHOW_ALL_RESULTS, true); prefs.putBoolean(SHOW_DERIVATIONS, true); prefs.putBoolean(SHOW_FEATURES, true); prefs.putBoolean(SHOW_SEMANTICS, true); prefs.put(FEATURES_TO_SHOW, ""); } else if (input.equals(":q")) { break; // end of while loop } else if (input.equals(":h")) { showHelp(); } else if (input.equals(":reset")) { prefs.putBoolean(SHOW_ALL_RESULTS, false); prefs.putBoolean(SHOW_DERIVATIONS, false); prefs.putBoolean(SHOW_TIMING, false); prefs.putBoolean(SHOW_INCOMPLETE_EDGES, false); prefs.putBoolean(Edge.SHOW_COMPLETENESS, false); prefs.putBoolean(Edge.SHOW_BITSET, false); prefs.putBoolean(SHOW_FEATURES, false); prefs.putBoolean(SHOW_SEMANTICS, false); prefs.put(FEATURES_TO_SHOW, ""); prefs.putBoolean(VISUALIZE, false); prefs.put("VISFNAME", ""); prefs.putBoolean(Converter.USE_WORD_POSITIONS_FOR_ATOM_CONVERSION, true); prefs.putBoolean(AbstractCompositionRule.EISNER_CONSTRAINTS, true); AbstractCompositionRule.useEisnerConstraints = true; prefs.putInt(Parser.PARSE_TIME_LIMIT, Parser.NO_TIME_LIMIT); prefs.putInt(Parser.PARSE_EDGE_LIMIT, Parser.NO_EDGE_LIMIT); prefs.putInt(Parser.PARSE_PRUNING_VALUE, Parser.NO_PRUNING); prefs.putInt(Parser.PARSE_CELL_PRUNING_VALUE, Parser.NO_PRUNING); prefs.putBoolean(Parser.PARSE_LAZY_UNPACKING, true); prefs.putBoolean(EdgeFactory.USE_INDEXING, true); prefs.putBoolean(EdgeFactory.ALLOW_MISSING_INDEX_COMBOS, false); prefs.putBoolean(EdgeFactory.USE_CHUNKS, true); prefs.putBoolean(EdgeFactory.USE_FEATURE_LICENSING, true); prefs.putBoolean(opennlp.ccg.realize.Chart.USE_COMBOS, true); prefs.putBoolean(opennlp.ccg.realize.Chart.USE_PACKING, false); prefs.putInt(opennlp.ccg.realize.Chart.TIME_LIMIT, opennlp.ccg.realize.Chart.NO_TIME_LIMIT); prefs.putDouble(opennlp.ccg.realize.Chart.NEW_BEST_TIME_LIMIT, opennlp.ccg.realize.Chart.NO_TIME_LIMIT); prefs.putInt(opennlp.ccg.realize.Chart.EDGE_LIMIT, opennlp.ccg.realize.Chart.NO_EDGE_LIMIT); prefs.putInt(opennlp.ccg.realize.Chart.PRUNING_VALUE, opennlp.ccg.realize.Chart.NO_PRUNING); prefs.putInt(opennlp.ccg.realize.Chart.CELL_PRUNING_VALUE, opennlp.ccg.realize.Chart.NO_PRUNING); prefs.putBoolean(opennlp.ccg.realize.Chart.DO_UNPACKING, true); } else if (input.equals(":show feats") || input.equals(":feats") || input.equals(":f")) { prefs.putBoolean(SHOW_FEATURES, true); prefs.put(FEATURES_TO_SHOW, ""); Grammar.theGrammar.prefs.showFeats = true; Grammar.theGrammar.prefs.featsToShow = ""; } else if (input.startsWith(":show feats ") || input.startsWith(":feats ") || input.startsWith(":f ")) { prefs.putBoolean(SHOW_FEATURES, true); String s = input.substring(input.indexOf(' ') + 1); if (s.startsWith("feats ")) { s = s.substring(6); } prefs.put(FEATURES_TO_SHOW, s); Grammar.theGrammar.prefs.showFeats = true; Grammar.theGrammar.prefs.featsToShow = s; } else if (input.equals(":nofeats") || input.equals(":foff")) { prefs.putBoolean(SHOW_FEATURES, false); 
prefs.put(FEATURES_TO_SHOW, ""); Grammar.theGrammar.prefs.showFeats = false; Grammar.theGrammar.prefs.featsToShow = ""; } else if (input.equals(":show semantics") || input.equals(":sem") || input.equals(":s")) { prefs.putBoolean(SHOW_SEMANTICS, true); Grammar.theGrammar.prefs.showSem = true; } else if (input.equals(":nosem") || input.equals(":soff")) { prefs.putBoolean(SHOW_SEMANTICS, false); Grammar.theGrammar.prefs.showSem = false; } else if (input.equals(":show all") || input.equals(":all") || input.equals(":a")) { prefs.putBoolean(SHOW_ALL_RESULTS, true); } else if (input.equals(":notall") || input.equals(":aoff")) { prefs.putBoolean(SHOW_ALL_RESULTS, false); } else if (input.equals(":show derivs") || input.equals(":derivs") || input.equals(":d")) { prefs.putBoolean(SHOW_DERIVATIONS, true); } else if (input.equals(":noderivs") || input.equals(":doff")) { prefs.putBoolean(SHOW_DERIVATIONS, false); } else if (input.startsWith(":time limit") || input.startsWith(":tl")) { String[] tokens = input.split("\\s+"); String last = tokens[tokens.length-1]; try { int limit = Integer.parseInt(last); prefs.putInt(opennlp.ccg.realize.Chart.TIME_LIMIT, limit); } catch (NumberFormatException exc) { System.out.println("Expecting a time limit in ms, rather than: " + last); } } else if (input.startsWith(":no time limit") || input.startsWith(":notl")) { prefs.putInt(opennlp.ccg.realize.Chart.TIME_LIMIT, opennlp.ccg.realize.Chart.NO_TIME_LIMIT); } else if (input.startsWith(":nbtl")) { String[] tokens = input.split("\\s+"); String last = tokens[tokens.length-1]; try { double limit = Double.parseDouble(last); prefs.putDouble(opennlp.ccg.realize.Chart.NEW_BEST_TIME_LIMIT, limit); } catch (NumberFormatException exc) { System.out.println("Expecting a time limit in ms, rather than: " + last); } } else if (input.startsWith(":nonbtl")) { prefs.putDouble(opennlp.ccg.realize.Chart.NEW_BEST_TIME_LIMIT, opennlp.ccg.realize.Chart.NO_TIME_LIMIT); } else if (input.startsWith(":edge limit") || input.startsWith(":el")) { String[] tokens = input.split("\\s+"); String last = tokens[tokens.length-1]; try { int limit = Integer.parseInt(last); prefs.putInt(opennlp.ccg.realize.Chart.EDGE_LIMIT, limit); } catch (NumberFormatException exc) { System.out.println("Expecting an edge limit, rather than: " + last); } } else if (input.startsWith(":no edge limit") || input.startsWith(":noel")) { prefs.putInt(opennlp.ccg.realize.Chart.EDGE_LIMIT, opennlp.ccg.realize.Chart.NO_EDGE_LIMIT); } else if (input.startsWith(":pruning value") || input.startsWith(":pv")) { String[] tokens = input.split("\\s+"); String last = tokens[tokens.length-1]; try { int val = Integer.parseInt(last); prefs.putInt(opennlp.ccg.realize.Chart.PRUNING_VALUE, val); } catch (NumberFormatException exc) { System.out.println("Expecting an integer pruning value, rather than: " + last); } } else if (input.startsWith(":no pruning value") || input.startsWith(":nopv")) { prefs.putInt(opennlp.ccg.realize.Chart.PRUNING_VALUE, opennlp.ccg.realize.Chart.NO_PRUNING); } else if (input.startsWith(":cell pruning value") || input.startsWith(":cpv")) { String[] tokens = input.split("\\s+"); String last = tokens[tokens.length-1]; try { int val = Integer.parseInt(last); prefs.putInt(opennlp.ccg.realize.Chart.CELL_PRUNING_VALUE, val); } catch (NumberFormatException exc) { System.out.println("Expecting an integer cell pruning value, rather than: " + last); } } else if (input.startsWith(":no cell pruning value") || input.startsWith(":nocpv")) { 
prefs.putInt(opennlp.ccg.realize.Chart.CELL_PRUNING_VALUE, opennlp.ccg.realize.Chart.NO_PRUNING); } else if (input.equals(":upon")) { prefs.putBoolean(opennlp.ccg.realize.Chart.DO_UNPACKING, true); } else if (input.equals(":upoff")) { prefs.putBoolean(opennlp.ccg.realize.Chart.DO_UNPACKING, false); } else if (input.startsWith(":select reading") || input.startsWith(":sel")) { String[] tokens = input.split("\\s+"); String last = tokens[tokens.length-1]; try { int reading = Integer.parseInt(last); if (reading > lastResults.length) { System.out.println("Only " + lastResults.length + " parses found."); } else if (lastLFs[reading-1] == null) { System.out.println("LF not available, use :all command and reparse."); } else { lastReading = reading-1; } } catch (NumberFormatException exc) { System.out.println("Expecting a reading number, rather than: " + last); } } else if (input.equals(":timing on") || input.equals(":ton") || input.equals(":t")) { prefs.putBoolean(SHOW_TIMING, true); } else if (input.equals(":timing off") || input.equals(":toff")) { prefs.putBoolean(SHOW_TIMING, false); } else if (input.equals(":show incomplete") || input.equals(":inc")) { prefs.putBoolean(SHOW_INCOMPLETE_EDGES, true); prefs.putBoolean(Edge.SHOW_COMPLETENESS, true); } else if (input.equals(":noinc")) { prefs.putBoolean(SHOW_INCOMPLETE_EDGES, false); prefs.putBoolean(Edge.SHOW_COMPLETENESS, false); } else if (input.equals(":indexing on") || input.equals(":ion")) { prefs.putBoolean(EdgeFactory.USE_INDEXING, true); } else if (input.equals(":indexing off") || input.equals(":ioff")) { prefs.putBoolean(EdgeFactory.USE_INDEXING, false); } else if (input.equals(":missing index combos on") || input.equals(":mion")) { prefs.putBoolean(EdgeFactory.ALLOW_MISSING_INDEX_COMBOS, true); } else if (input.equals(":missing index combos off") || input.equals(":mioff")) { prefs.putBoolean(EdgeFactory.ALLOW_MISSING_INDEX_COMBOS, false); } else if (input.equals(":chunks on") || input.equals(":con")) { prefs.putBoolean(EdgeFactory.USE_CHUNKS, true); } else if (input.equals(":chunks off") || input.equals(":coff")) { prefs.putBoolean(EdgeFactory.USE_CHUNKS, false); } else if (input.equals(":feature licensing on") || input.equals(":flon")) { prefs.putBoolean(EdgeFactory.USE_FEATURE_LICENSING, true); } else if (input.equals(":feature licensing off") || input.equals(":floff")) { prefs.putBoolean(EdgeFactory.USE_FEATURE_LICENSING, false); } else if (input.equals(":combos on") || input.equals(":ccon")) { prefs.putBoolean(opennlp.ccg.realize.Chart.USE_COMBOS, true); } else if (input.equals(":combos off") || input.equals(":ccoff")) { prefs.putBoolean(opennlp.ccg.realize.Chart.USE_COMBOS, false); } else if (input.equals(":pon")) { prefs.putBoolean(opennlp.ccg.realize.Chart.USE_PACKING, true); } else if (input.equals(":poff")) { prefs.putBoolean(opennlp.ccg.realize.Chart.USE_PACKING, false); } else if (input.startsWith(":realize") || input.startsWith(":r")) { LF lf; NgramScorer ngramScorer; // nb: need to upgrade, consolidate :r FN option with Realize.java ... int space = input.indexOf(" "); if (space != -1) { // check for filename String filename = readFilename(input.substring(space)); if (filename == null) { System.out.println("Expecting a filename to read from."); continue; } try { Document doc = grammar.loadFromXml(filename); lf = Realizer.getLfFromDoc(doc); // nb: just handling explicit targets for now ... 
List targetElts = doc.getRootElement().getChildren("target"); String[] targets = new String[targetElts.size()]; for (int i=0; i < targetElts.size(); i++) { Element ex = (Element) targetElts.get(i); String target = ex.getText(); targets[i] = target; } ngramScorer = new NgramPrecisionModel(targets); } catch (IOException exc) { System.out.println("Unable to read: " + filename); System.out.println(exc.toString()); continue; } } else { // otherwise use last reading of last LF if (lastLFs == null || lastLFs[lastReading] == null) { System.out.println("Nothing to realize!"); continue; } lf = grammar.transformLF(lastLFs[lastReading]); String[] targets = new String[1]; targets[0] = lastSentence; ngramScorer = new NgramPrecisionModel(targets); } realizer.realize(lf, ngramScorer); opennlp.ccg.realize.Chart chart = realizer.getChart(); boolean showIncompleteEdges = prefs.getBoolean(SHOW_INCOMPLETE_EDGES, false); boolean showTiming = prefs.getBoolean(SHOW_TIMING, false); if (showIncompleteEdges) chart.printEdges(); else chart.printEdges(true, true); if (showTiming) { chart.printTiming(); } } else if (input.startsWith(":2xml")) { if (lastLFs == null || lastLFs[lastReading] == null) { System.out.println("Nothing to save!"); continue; } String filename = readFilename(input.substring(5)); if (filename == null) { System.out.println("Expecting a filename to save to."); continue; } grammar.saveToXml(lastLFs[lastReading], lastSentence, filename); System.out.println("Wrote LF to \"" + filename + "\""); } else if (input.startsWith(":2tb")) { if (lastLFs == null || lastLFs[lastReading] == null) { System.out.println("Nothing to save!"); continue; } String filename = readFilename(input.substring(4)); if (filename == null) { filename = "testbed.xml"; } RegressionInfo.addToTestbed(grammar, lastResults[lastReading], lastResults.length, lastLFs[lastReading], filename); System.out.println("Added test item to \"" + filename + "\""); } else if (input.startsWith(":2apml")) { if (lastSentence.length() == 0) { System.out.println("Nothing to save!"); continue; } String filename = readFilename(input.substring(6)); if (filename == null) { System.out.println("Expecting a filename to save to."); continue; } grammar.saveToApml(lastResults[lastReading], filename); System.out.println("Wrote \"" + lastSentence + "\" to \"" + filename + "\" as APML"); } else if (input.startsWith(":vison")) { prefs.putBoolean(VISUALIZE, true); if ((input.startsWith(":vison ")) && (input.length( )>= 8)) { String fname = input.substring(7); if (fname.lastIndexOf('.')!=-1) { System.out.println("Filename should not contain a suffix. 
Suffixes .tex and .dvi are assumed."); prefs.put("VISFNAME", ""); } else prefs.put("VISFNAME", fname); } else prefs.put("VISFNAME", ""); } else if (input.equals(":visoff")) { prefs.putBoolean(VISUALIZE, false); prefs.put("VISFNAME", ""); } else if (input.equals(":wordpos")) { prefs.putBoolean(Converter.USE_WORD_POSITIONS_FOR_ATOM_CONVERSION, true); } else if (input.equals(":nowordpos")) { prefs.putBoolean(Converter.USE_WORD_POSITIONS_FOR_ATOM_CONVERSION, false); } else if (input.equals(":eisner")) { prefs.putBoolean(AbstractCompositionRule.EISNER_CONSTRAINTS, true); AbstractCompositionRule.useEisnerConstraints = true; } else if (input.equals(":noeisner")) { prefs.putBoolean(AbstractCompositionRule.EISNER_CONSTRAINTS, false); AbstractCompositionRule.useEisnerConstraints = false; } else if (input.startsWith(":parse time limit") || input.startsWith(":ptl")) { String[] tokens = input.split("\\s+"); String last = tokens[tokens.length-1]; try { int limit = Integer.parseInt(last); prefs.putInt(Parser.PARSE_TIME_LIMIT, limit); } catch (NumberFormatException exc) { System.out.println("Expecting a time limit in ms, rather than: " + last); } } else if (input.startsWith(":no parse time limit") || input.startsWith(":noptl")) { prefs.putInt(Parser.PARSE_TIME_LIMIT, Parser.NO_TIME_LIMIT); } else if (input.startsWith(":parse edge limit") || input.startsWith(":pel")) { String[] tokens = input.split("\\s+"); String last = tokens[tokens.length-1]; try { int limit = Integer.parseInt(last); prefs.putInt(Parser.PARSE_EDGE_LIMIT, limit); } catch (NumberFormatException exc) { System.out.println("Expecting an edge limit, rather than: " + last); } } else if (input.startsWith(":no parse edge limit") || input.startsWith(":nopel")) { prefs.putInt(Parser.PARSE_EDGE_LIMIT, Parser.NO_EDGE_LIMIT); } else if (input.startsWith(":parse pruning value") || input.startsWith(":ppv")) { String[] tokens = input.split("\\s+"); String last = tokens[tokens.length-1]; try { int val = Integer.parseInt(last); prefs.putInt(Parser.PARSE_PRUNING_VALUE, val); } catch (NumberFormatException exc) { System.out.println("Expecting an integer pruning value, rather than: " + last); } } else if (input.startsWith(":no parse pruning value") || input.startsWith(":noppv")) { prefs.putInt(Parser.PARSE_PRUNING_VALUE, Parser.NO_PRUNING); } else if (input.startsWith(":parse cell pruning value") || input.startsWith(":pcpv")) { String[] tokens = input.split("\\s+"); String last = tokens[tokens.length-1]; try { int val = Integer.parseInt(last); prefs.putInt(Parser.PARSE_CELL_PRUNING_VALUE, val); } catch (NumberFormatException exc) { System.out.println("Expecting an integer cell pruning value, rather than: " + last); } } else if (input.startsWith(":no parse cell pruning value") || input.startsWith(":nopcpv")) { prefs.putInt(Parser.PARSE_CELL_PRUNING_VALUE, Parser.NO_PRUNING); } else if (input.equals(":plazy")) { prefs.putBoolean(Parser.PARSE_LAZY_UNPACKING, true); } else if (input.equals(":noplazy")) { prefs.putBoolean(Parser.PARSE_LAZY_UNPACKING, false); } else { try { if (input.length() == 0) { if (lastSentence.length() > 0) { input = lastSentence; } else { System.out.println("Nothing to parse!"); continue; } } parser.parse(input); List parses = parser.getResult(); Sign[] results = new Sign[parses.size()]; parses.toArray(results); int resLength = results.length; switch (resLength) { case 0: break; case 1: System.out.println(resLength + " parse found.\n"); break; default: System.out.println(resLength + " parses found.\n"); } lastResults = results; lastLFs = 
new LF[resLength]; if (input.length() > 0) { lastSentence = input; } lastReading = 0; boolean showall = prefs.getBoolean(SHOW_ALL_RESULTS, false); boolean showderivs = prefs.getBoolean(SHOW_DERIVATIONS, false); boolean showsem = prefs.getBoolean(SHOW_SEMANTICS, true); boolean visualize = prefs.getBoolean(VISUALIZE, false); boolean showfeats = prefs.getBoolean(SHOW_FEATURES, false); String feats_to_show = prefs.get(FEATURES_TO_SHOW, ""); Visualizer vis = null; String baseFileName = null; grammar.prefs.showSem = showsem; grammar.prefs.showFeats = showfeats; grammar.prefs.featsToShow = feats_to_show; if (visualize) { vis = new Visualizer(); if (prefs.get("VISFNAME", "").equals("")) baseFileName = vis.getTempFileName(); else baseFileName = prefs.get("VISFNAME", ""); vis.writeHeader(baseFileName+".tex"); } int numToShow = (showall) ? resLength : 1; for (int i=0; i < numToShow; i++) { Category cat = results[i].getCategory(); LF convertedLF = null; if (cat.getLF() != null) { cat = cat.copy(); Nominal index = cat.getIndexNominal(); Sign rootSign = results[i]; // could add a switch here for naming convention convertedLF = HyloHelper.compactAndConvertNominals(cat.getLF(), index, rootSign); lastLFs[i] = convertedLF; cat.setLF(null); } String parseNum = (resLength == 1) ? "Parse: " : ("Parse "+(i+1)+": "); System.out.print(parseNum + cat.toString()); if (showsem && convertedLF != null) { System.out.println(" : "); System.out.println(" " + convertedLF.prettyPrint(" ")); } else System.out.println(); if (showderivs) { System.out.println("------------------------------"); System.out.println(results[i].getDerivationHistory()); } if (visualize) vis.saveTeXFile(results[i], baseFileName + ".tex" ); } if (visualize) { vis.writeFooter(baseFileName + ".tex"); vis.show(baseFileName); if (prefs.get("VISFNAME","").equals("")) // If temporary file, vis.cleanFiles(baseFileName); // clean it else { vis.cleanAuxFiles(baseFileName); System.out.println("Saved to files " + baseFileName + ".tex and " + baseFileName + ".dvi"); } vis = null; } } catch(ParseException pe) { System.out.println(pe); } } } // store command input history in preferences prefs.put(historyKey, lineReader.getCommandHistory()); // done System.out.println("Exiting tccg."); System.exit(0); } // reads the next token in the string as a filename private static String readFilename(String s) throws IOException { StreamTokenizer st = new StreamTokenizer(new StringReader(s)); st.wordChars('/','/'); st.wordChars('\\','\\'); st.wordChars(':',':'); st.nextToken(); return st.sval; } /** Shows help for the command-line tool. 
*/ public static void showHelp() { System.out.println(); System.out.println("Commands for tccg (otherwise input is parsed):"); System.out.println(); System.out.println(" :sh\t\t\tshow current preference settings"); System.out.println(" :v\t\t\tverbose output"); System.out.println(" :reset\t\treset options to defaults"); System.out.println(" :feats (L)\t\tshow features (or just show features in list L)"); System.out.println(" :nofeats\t\tdon't show features"); System.out.println(" :sem\t\t\tshow semantics"); System.out.println(" :nosem\t\tdon't show semantics"); System.out.println(" :all\t\t\tshow all parse results"); System.out.println(" :notall\t\tdon't show all parse results"); System.out.println(" :derivs\t\tshow derivations"); System.out.println(" :noderivs\t\tdon't show derivations"); System.out.println(" :vison (FN)\t\tturn visualization on (saving to file with name FN)"); System.out.println(" :visoff\t\tturn visualization off"); System.out.println(" :wordpos\t\tuse word positions to name converted nominals"); System.out.println(" :nowordpos\t\tdon't use word positions to name converted nominals"); System.out.println(" :eisner\t\tuse Eisner constraints on composition"); System.out.println(" :noeisner\t\tturn off Eisner constraints on composition"); System.out.println(); System.out.println(" :ptl N\t\tset parse time limit to N ms"); System.out.println(" :noptl\t\tset parse time limit to none"); System.out.println(" :pel N\t\tset parse edge limit to N"); System.out.println(" :nopel\t\tset parse edge limit to none"); System.out.println(" :ppv N\t\tset parse pruning value to N"); System.out.println(" :noppv\t\tset parse pruning value to none"); System.out.println(" :pcpv N\t\tset parse cell pruning value to N"); System.out.println(" :nopcpv\t\tset parse cell pruning value to none"); System.out.println(" :plazy\t\tturn lazy unpacking on in parser"); System.out.println(" :noplazy\t\tturn lazy unpacking off in parser"); System.out.println(); System.out.println(" :r (FN)\t\trealize selected reading (or from XML file with name FN)"); System.out.println(" :sel N\t\tselect reading N for realization or saving"); System.out.println(" :2xml FN\t\tsave last input and LF to XML file with name FN"); System.out.println(" :2tb (FN)\t\tadd last input and LF as a test item (to file with name FN)"); System.out.println(" :2apml FN\t\tsave last input to APML file with name FN"); System.out.println(); System.out.println(" :tl N\t\t\tset realization time limit to N ms"); System.out.println(" :notl\t\t\tset realization time limit to none"); System.out.println(" :nbtl N\t\tset realization new best time limit to N ms | N < 1 of first"); System.out.println(" :nonbtl\t\tset realization new best time limit to none"); System.out.println(" :el N\t\t\tset realization edge limit to N"); System.out.println(" :noel\t\t\tset realization edge limit to none"); System.out.println(" :pv N\t\t\tset realization pruning value to N"); System.out.println(" :nopv\t\t\tset realization pruning value to none"); System.out.println(" :cpv N\t\tset realization cell pruning value to N"); System.out.println(" :nocpv\t\tset realization cell pruning value to none"); System.out.println(" :upon\t\t\tturn unpacking on"); System.out.println(" :upoff\t\tturn unpacking off"); System.out.println(" :t\t\t\tturn realization timing on"); System.out.println(" :toff\t\t\tturn realization timing off"); System.out.println(" :inc\t\t\tshow incomplete realization edges"); System.out.println(" :noinc\t\tdon't show incomplete realization edges"); 
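/*
 * A few concrete invocations of the options listed above (feature names and
 * file names are grammar-specific and purely illustrative):
 *
 *   :feats num pers      show only the num and pers features
 *   :sel 2               select the second parse for :r, :2xml, :2tb, :2apml
 *   :tl 10000            stop realization after 10 seconds
 *   :2tb mytests.xml     append the current reading to mytests.xml as a test item
 */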
System.out.println(); System.out.println(" :ion\t\t\tturn index filtering on"); System.out.println(" :ioff\t\t\tturn index filtering off"); System.out.println(" :mion\t\t\tturn missing index combos on"); System.out.println(" :mioff\t\tturn missing index combos off"); System.out.println(" :con\t\t\tturn LF chunks on"); System.out.println(" :coff\t\t\tturn LF chunks off"); System.out.println(" :flon\t\t\tturn feature licensing on"); System.out.println(" :floff\t\tturn feature licensing off"); System.out.println(" :ccon\t\t\tturn collected combos on"); System.out.println(" :ccoff\t\tturn collected combos off"); System.out.println(" :pon\t\t\tturn packing on"); System.out.println(" :poff\t\t\tturn packing off"); System.out.println(); System.out.println(" :q\t\t\tquit tccg"); System.out.println(" :h\t\t\tshow this message"); System.out.println(); } /** Shows current settings. */ public static void showSettings(Preferences prefs) { System.out.println(); System.out.println("Current preference settings:"); System.out.println(); boolean showfeats = prefs.getBoolean(SHOW_FEATURES, false); boolean showsem = prefs.getBoolean(SHOW_SEMANTICS, true); String feats = prefs.get(FEATURES_TO_SHOW, ""); System.out.println(" show feats:\t\t" + showfeats); System.out.println(" show semantics:\t" + showsem); if (showfeats) { System.out.println(" feats to show:\t" + ((feats.length() > 0) ? feats : "all")); } boolean showall = prefs.getBoolean(SHOW_ALL_RESULTS, false); boolean showderivs = prefs.getBoolean(SHOW_DERIVATIONS, false); System.out.println(" show all:\t\t" + showall); System.out.println(" show derivs:\t\t" + showderivs); boolean visualize = prefs.getBoolean(VISUALIZE, false); String visfname = prefs.get("VISFNAME", ""); System.out.println(" visualize:\t\t" + ((visualize) ? "on" : "off")); if (visfname.length() > 0) { System.out.println(" vis file name:\t" + visfname); } boolean wordpos = prefs.getBoolean(Converter.USE_WORD_POSITIONS_FOR_ATOM_CONVERSION, true); System.out.println(" word pos:\t\t" + ((wordpos) ? "on" : "off")); boolean eisner = prefs.getBoolean(AbstractCompositionRule.EISNER_CONSTRAINTS, true); System.out.println(" Eisner constraints:\t" + ((eisner) ? "on" : "off")); System.out.println(); int ptl = prefs.getInt(Parser.PARSE_TIME_LIMIT, Parser.NO_TIME_LIMIT); System.out.println(" parse time limit:\t" + ((ptl == Parser.NO_TIME_LIMIT) ? "none" : "" + ptl + " ms")); int pel = prefs.getInt(Parser.PARSE_EDGE_LIMIT, Parser.NO_EDGE_LIMIT); System.out.println(" parse edge limit:\t" + ((pel == Parser.NO_EDGE_LIMIT) ? "none" : "" + pel)); int ppv = prefs.getInt(Parser.PARSE_PRUNING_VALUE, Parser.NO_PRUNING); System.out.println(" parse pruning value:\t" + ((ppv == Parser.NO_PRUNING) ? "none" : "" + ppv)); int pcpv = prefs.getInt(Parser.PARSE_CELL_PRUNING_VALUE, Parser.NO_PRUNING); System.out.println(" parse cell prune val:\t" + ((pcpv == Parser.NO_PRUNING) ? "none" : "" + pcpv)); boolean plazy = prefs.getBoolean(Parser.PARSE_LAZY_UNPACKING, true); System.out.println(" lazy unpacking:\t" + ((plazy) ? "on" : "off")); System.out.println(); int tl = prefs.getInt(opennlp.ccg.realize.Chart.TIME_LIMIT, opennlp.ccg.realize.Chart.NO_TIME_LIMIT); System.out.println(" time limit:\t\t" + ((tl == opennlp.ccg.realize.Chart.NO_TIME_LIMIT) ? "none" : "" + tl + " ms")); double nbtl = prefs.getDouble(opennlp.ccg.realize.Chart.NEW_BEST_TIME_LIMIT, opennlp.ccg.realize.Chart.NO_TIME_LIMIT); String nbtlStr = (nbtl >= 1) ? 
(((int)nbtl) + " ms") : (nbtl + " of first"); System.out.println(" new best time limit:\t" + ((nbtl == opennlp.ccg.realize.Chart.NO_TIME_LIMIT) ? "none" : nbtlStr)); int el = prefs.getInt(opennlp.ccg.realize.Chart.EDGE_LIMIT, opennlp.ccg.realize.Chart.NO_EDGE_LIMIT); System.out.println(" edge limit:\t\t" + ((el == opennlp.ccg.realize.Chart.NO_EDGE_LIMIT) ? "none" : "" + el)); int pv = prefs.getInt(opennlp.ccg.realize.Chart.PRUNING_VALUE, opennlp.ccg.realize.Chart.NO_PRUNING); System.out.println(" pruning value:\t" + ((pv == opennlp.ccg.realize.Chart.NO_PRUNING) ? "none" : "" + pv)); int cpv = prefs.getInt(opennlp.ccg.realize.Chart.CELL_PRUNING_VALUE, opennlp.ccg.realize.Chart.NO_PRUNING); System.out.println(" cell pruning value:\t" + ((cpv == opennlp.ccg.realize.Chart.NO_PRUNING) ? "none" : "" + cpv)); boolean unpacking = prefs.getBoolean(opennlp.ccg.realize.Chart.DO_UNPACKING, true); System.out.println(" unpacking:\t\t" + ((unpacking) ? "on" : "off")); boolean showtiming = prefs.getBoolean(SHOW_TIMING, false); System.out.println(" timing:\t\t" + ((showtiming) ? "on" : "off")); boolean showinc = prefs.getBoolean(SHOW_INCOMPLETE_EDGES, false); System.out.println(" show incomplete:\t" + ((showinc) ? "on" : "off")); System.out.println(); boolean indexing = prefs.getBoolean(EdgeFactory.USE_INDEXING, true); boolean missingIndexCombos = prefs.getBoolean(EdgeFactory.ALLOW_MISSING_INDEX_COMBOS, false); boolean chunks = prefs.getBoolean(EdgeFactory.USE_CHUNKS, true); boolean licensing = prefs.getBoolean(EdgeFactory.USE_FEATURE_LICENSING, true); boolean combos = prefs.getBoolean(opennlp.ccg.realize.Chart.USE_COMBOS, true); boolean packing = prefs.getBoolean(opennlp.ccg.realize.Chart.USE_PACKING, false); System.out.println(" index filtering:\t" + ((indexing) ? "on" : "off")); System.out.println(" missing index combos:\t" + ((missingIndexCombos) ? "on" : "off")); System.out.println(" chunks:\t\t" + ((chunks) ? "on" : "off")); System.out.println(" licensing:\t\t" + ((licensing) ? "on" : "off")); System.out.println(" combos:\t\t" + ((combos) ? "on" : "off")); System.out.println(" packing:\t\t" + ((packing) ? "on" : "off")); System.out.println(); } } ================================================ FILE: src/opennlp/ccg/WebCCG.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2006 Ben Wing. // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg; import opennlp.ccg.lexicon.*; import opennlp.ccg.grammar.*; import opennlp.ccg.parse.*; import opennlp.ccg.util.*; import opennlp.ccg.synsem.*; //import opennlp.ccg.realize.*; import opennlp.ccg.hylo.*; //import opennlp.ccg.ngrams.*; //import opennlp.ccg.test.*; //import org.jdom.*; import java.io.*; import java.net.*; import java.util.*; /** * An interface for use with a higher-level web interface. This should * provide as simple an interface onto parsing as possible, with its output * in a format that can be easily handled by a CGI program or similar. * Called as * * webccg [-showall] [-showderivs] [-showsem] [-visualize FILE] GRAMMARDIR -showall shows all parses rather than just the first one. -showderivs shows the derivation history of each parse. -showsem shows the logical form of each parse. -visualize output a visualization of the parses into FILE (in PNG format). * * @author Ben Wing * @version $Revision: 1.4 $, $Date: 2009/12/21 03:27:18 $ */ public class WebCCG { /** Main method for tccg. */ public static void main(String[] args) throws IOException, LexException { String usage = "java opennlp.ccg.WebCCG " + "[-showall] [-showderivs] [-showsem] [-showfeats] [-visualize FILE] GRAMMARDIR\n" + "\n" + "-showall shows all parses rather than just the first one.\n" + "-showderivs shows the derivation history of each parse.\n" + "-showsem shows the logical form of each parse.\n" + "-showfeats shows the features associated with each nonterminal.\n" + "-visualize output a visualization of the parses into FILE (in TEX format).\n"+ " to convert to an image, try this:\n" + " latex foo.tex; dvips foo.dvi | pstopnm | pnmtopng > foo.png\n" + "\n" + "Sentences to parse are read from standard input.\n"; if (args.length > 0 && (args[0].equals("-h") || args[0].equals("-help"))) { System.out.println("Usage: " + usage); System.exit(0); } // args //String prefsfile = null; boolean showall = false; boolean showderivs = false; boolean showsem = false; boolean showfeats = false; String visfile = null; int i; for (i = 0; i < args.length; i++) { if (args[i].equals("-showall")) showall = true; else if (args[i].equals("-showderivs")) showderivs = true; else if (args[i].equals("-showsem")) showsem = true; else if (args[i].equals("-showfeats")) showfeats = true; else if (args[i].equals("-visualize")) visfile = args[++i]; else break; } if (i != args.length - 1) { System.out.println("Usage: " + usage); System.exit(0); } String grammarfile = args[i] + "/grammar.xml"; // load grammar URL grammarURL = new File(grammarfile).toURI().toURL(); //System.out.println("Loading grammar from URL: " + grammarURL); Grammar grammar = new Grammar(grammarURL); //if (grammar.getName() != null) // System.out.println("Grammar '" + grammar.getName() + "' loaded."); // create parser and realizer Parser parser = new Parser(grammar); //Realizer realizer = new Realizer(grammar); BufferedReader br = new BufferedReader(new InputStreamReader(System.in)); while (true) { String input = br.readLine(); if (input == null) break; // EOF input = input.trim(); if (input.equals("")) continue; try { parser.parse(input); List parses = parser.getResult(); Sign[] results = new Sign[parses.size()]; parses.toArray(results); int resLength = results.length; System.out.print("\"" + input + "\": "); switch (resLength) { case 0: break; case 1: System.out.println(resLength + " parse found.\n"); break; default: System.out.println(resLength + " parses found.\n"); } 
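/*
 * Since sentences are read from standard input and results are echoed in the
 * fixed format printed here, a CGI script can simply pipe text through the
 * program.  A sketch of an exchange (the grammar directory and the category
 * shown are hypothetical; the surrounding format follows the code above):
 *
 *   echo "he sees her" | java opennlp.ccg.WebCCG GRAMMARDIR
 *
 *   "he sees her": 1 parse found.
 *
 *   Parse: s
 */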
Visualizer vis = null; grammar.prefs.showSem = showsem; grammar.prefs.showFeats = showfeats; grammar.prefs.featsToShow = ""; if (visfile != null) { vis = new Visualizer(); vis.writeHeader(visfile); } int numToShow = (showall) ? resLength : 1; for (i=0; i < numToShow; i++) { Category cat = results[i].getCategory(); LF convertedLF = null; if (cat.getLF() != null) { cat = cat.copy(); Nominal index = cat.getIndexNominal(); convertedLF = HyloHelper.compactAndConvertNominals(cat.getLF(), index, results[i]); cat.setLF(null); } String parseNum = (resLength == 1) ? "Parse: " : ("Parse "+(i+1)+": "); System.out.print(parseNum + cat.toString()); if (showsem && convertedLF != null) { System.out.println(" : "); System.out.println(" " + convertedLF.prettyPrint(" ")); } else System.out.println(); if (showderivs) { System.out.println("------------------------------"); System.out.println(results[i].getDerivationHistory()); } if (visfile != null) vis.saveTeXFile(results[i], visfile); } if (visfile != null) { vis.writeFooter(visfile); } } catch(ParseException pe) { System.out.print("\"" + input + "\": "); System.out.println(pe + ".\n"); } } } } ================================================ FILE: src/opennlp/ccg/alignment/AbstractEncodingScheme.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.alignment; import java.util.Arrays; import java.util.Collections; import java.util.List; import java.util.Set; /** * Abstract class for implementing encoding schemes. This base class provides a constructor taking all the * necessary arguments for implementing {@link EncodingScheme}, and gives getter methods for all of them, * as required. * @author Scott Martin * @see EncodingScheme */ public abstract class AbstractEncodingScheme implements EncodingScheme { /** * Delimits a field within a mapping. */ protected Character fieldDelimiter; /** * Delimits a mapping. */ protected Character mappingDelimiter; /** * Delimits a group of mappings. */ protected Character groupDelimiter; /** * The index base for IDs. */ protected IndexBase phraseNumberBase; /** * The index base for indices. */ protected IndexBase indexBase; /** * The order of the fields in mappings corresponding to this encoding scheme. */ protected List order; /** * The set of required fields in this encoding scheme. */ protected Set required; /** * The fields that this encoding scheme uses by default. 
*/ protected Set defaults; final boolean fieldDelimSep, mappingDelimSep, groupDelimSep; protected AbstractEncodingScheme(Character fieldDelimiter, Character mappingDelimiter, Character groupDelimiter, IndexBase phraseNumberBase, IndexBase indexBase, Set defaults, Set required, MappingFormat.Field... order) { this.fieldDelimiter = fieldDelimiter; this.mappingDelimiter = mappingDelimiter; this.groupDelimiter = groupDelimiter; this.phraseNumberBase = phraseNumberBase; this.indexBase = indexBase; fieldDelimSep = isLineSeparator(fieldDelimiter); mappingDelimSep = isLineSeparator(mappingDelimiter); groupDelimSep = isLineSeparator(groupDelimiter); this.defaults = Collections.unmodifiableSet(defaults); this.required = Collections.unmodifiableSet(required); this.order = Collections.unmodifiableList(Arrays.asList(order)); } static boolean isLineSeparator(Character c) { // TODO why doesn't Character.getType(c) == Character.LINE_SEPARATOR work? return c == '\r' || c == '\n'; } /** * Tests whether the supplied character counts as a field delimiter according to this encoding scheme. * @return true if c is equal to {@link #fieldDelimiter} or both c and * {@link #fieldDelimiter} are line separators. */ public boolean isFieldDelimiter(Character c) { return fieldDelimiter.equals(c) || (fieldDelimSep && isLineSeparator(c)); } /** * Tests whether the supplied character counts as a mapping delimiter according to this encoding scheme. * @return true if c is equal to {@link #mappingDelimiter} or both c and * {@link #mappingDelimiter} are line separators. */ public boolean isMappingDelimiter(Character c) { return mappingDelimiter.equals(c) || (mappingDelimSep && isLineSeparator(c)); } /** * Tests whether the supplied character counts as a group delimiter according to this encoding scheme. * @return true if c is equal to {@link #groupDelimiter} or both c and * {@link #groupDelimiter} are line separators. */ public boolean isGroupDelimiter(Character c) { return groupDelimiter.equals(c) || (groupDelimSep && isLineSeparator(c)); } /** * Gets the delimiter for fields. */ public Character getFieldDelimiter() { return fieldDelimiter; } /** * Gets the delimiter for mappings. */ public Character getMappingDelimiter() { return mappingDelimiter; } /** * Gets the delimiter for groups. */ public Character getGroupDelimiter() { return groupDelimiter; } /** * Gets the numbering base used for phrases. */ public IndexBase getPhraseNumberBase() { return phraseNumberBase; } /** * Gets the numbering base used for mapping indices. */ public IndexBase getIndexBase() { return indexBase; } /** * Gets the order in which fields occur in this encoding scheme. */ public List getOrder() { return order; } /** * Gets the required (non-optional) fields in this scheme. */ public Set getRequired() { return required; } /** * @return Gets the default fields used by this scheme. */ public Set getDefaults() { return defaults; } /** * Gets a hash code for this encoding scheme based on its delimiters, index bases, and fields. */ @Override public int hashCode() { return 37 * fieldDelimiter.hashCode() + groupDelimiter.hashCode() + mappingDelimiter.hashCode() + indexBase.hashCode() + phraseNumberBase.hashCode() + order.hashCode() + required.hashCode() + defaults.hashCode(); } /** * Tests whether this encoding scheme is equal to another based on its delimiters, index bases, and fields. 
*/ @Override public boolean equals(Object obj) { if(obj instanceof AbstractEncodingScheme) { AbstractEncodingScheme e = (AbstractEncodingScheme)obj; return fieldDelimiter.equals(e.fieldDelimiter) && groupDelimiter.equals(e.groupDelimiter) && mappingDelimiter.equals(e.mappingDelimiter) && indexBase.equals(e.indexBase) && phraseNumberBase.equals(e.phraseNumberBase) && order.equals(e.order) && required.equals(e.required) && defaults.equals(e.defaults); } return false; } } ================================================ FILE: src/opennlp/ccg/alignment/Alignment.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.alignment; import static opennlp.ccg.alignment.PhrasePosition.A; import static opennlp.ccg.alignment.PhrasePosition.B; import java.util.AbstractMap; import java.util.AbstractSet; import java.util.Collection; import java.util.Collections; import java.util.Iterator; import java.util.LinkedHashMap; import java.util.LinkedHashSet; import java.util.Map; import java.util.Set; import opennlp.ccg.util.DelegatedFilter; import opennlp.ccg.util.Filter; import opennlp.ccg.util.FilteredSet; import opennlp.ccg.util.VisitedFilter; /** * An alignment consisting of a pair of phrases and a set of mappings between them. *

* This class is a flat representation of the mappings between indices in its * {@linkplain #getA() A-position} phrase and its {@linkplain #getB() B-position} phrase in that it is * simply a set of mappings. More granularity is available by calling * {@link #getTargets(Integer, PhrasePosition)}, which returns all the indices a certain index is mapped to * from a specified position. * Alignments also allow their indices to be accessed when the phrase position is not necessarily known, * via {@link #get(PhrasePosition)}, {@link #getIndices(PhrasePosition)}, and {@link #asMap(PhrasePosition)}. *

* A detached view of this alignment as a map whose keys are the indices in a * specified position and whose values are the sets of indices that each key index maps to can be obtained by calling * {@link #asMap(PhrasePosition)}. If only the set of indices mapped to by a certain index is required, * {@link #getTargets(Integer, PhrasePosition)} provides similar functionality. The static method * {@link #fromMap(Phrase, Phrase, Map)} allows an alignment to be reconstructed from a map of indices to * sets of indices. *

* A version of this alignment with the phrase positions reversed and all the mappings * {@linkplain Mapping#reverse() reversed} can be obtained by calling {@link #reverse()}. * * @author Scott Martin * @see PhrasePosition * @see Phrase * @see Mapping */ public class Alignment extends AbstractSet implements Comparable { final Phrase a, b; final Set mappings; /** * Creates a new alignment with the specified phrases and mappings between them. The specified set of * mappings is copied in a way that preserves whatever ordering is present in the original set, * via {@link LinkedHashSet}. * * @param a The phrase to use for {@linkplain PhrasePosition#A the "A" position}. * @param b The phrase to use for {@linkplain PhrasePosition#B the "B" position}. * @param mappings The mappings between a and b, where the * {@linkplain Mapping#getA() first index} is understood to belong to a and the * {@linkplain Mapping#getB() second index} is understood to belong to b. * * @throws IllegalArgumentException If either phrase is null, or if phrases a and b do not * have matching {@linkplain Phrase#getNumber() numbers}, if mappings is null, * or if any of the mappings have a non-null phrase number that is not equal to the phrases' numbers. * @throws IndexOutOfBoundsException If any of the mappings contains an index that does not * exist in the phrase in the corresponding position. * * @see LinkedHashSet */ public Alignment(Phrase a, Phrase b, Collection mappings) { checkPhrases(a, b); if(mappings == null) { throw new IllegalArgumentException("mappings is null"); } // have to set these first or checkMapping() throws exception this.a = a; this.b = b; for(Mapping m : mappings) { checkMapping(m); } this.mappings = new LinkedHashSet(mappings); } /** * Creates a new alignment based on the specified phrases and map view of their mappings. * @param a The {@linkplain PhrasePosition#A A-position} phrase. * @param b The {@linkplain PhrasePosition#B B-position} phrase. * @param map A map whose keys are the A-position indices and whose values are the B-position indices * that the corresponding key is mapped to. * @return A new alignment with mappings created based on the specified map. * * @see #asMap() */ public static Alignment fromMap(Phrase a, Phrase b, Map> map) { @SuppressWarnings("unchecked") Set ms = map.isEmpty() ? Collections.EMPTY_SET : new LinkedHashSet(); for(Integer k : map.keySet()) { for(Integer v : map.get(k)) { ms.add(new Mapping(a.getNumber(), k, v)); } } return new Alignment(a, b, ms); } /** * Creates an alignment based on this one except that the phrases have * switched positions and all of the mappings are reversed. * * @return A new alignment with the phrases swapped and all the mappings' * indices swapped. * * @see Mapping#reverse() */ public Alignment reverse() { @SuppressWarnings("unchecked") Alignment r = new Alignment(getB(), getA(), Collections.EMPTY_SET); for(Mapping m : mappings) { r.add(m.reverse()); } return r; } /** * Gets this alignment's number. * @return The value of the {@linkplain Phrase#getNumber() number} of the phrase in * both {@linkplain PhrasePosition positions}. */ public Integer getNumber() { return a.number; } /** * Gets the phrase in {@linkplain PhrasePosition#A A-position}. */ public Phrase getA() { return get(A); } /** * Gets the phrase in {@linkplain PhrasePosition#B B-position}. */ public Phrase getB() { return get(B); } /** * Gets the phrase in the specified position. * @param pos The position in which to find the phrase. 
* @return If pos is {@link PhrasePosition#A}, the A-phrase; otherwise the B-phrase. */ public Phrase get(PhrasePosition pos) { return (pos == A) ? a : b; } /** * Adds a new mapping to this alignment. * @throws IndexOutOfBoundsException If either of the indices in m is out of bounds for the * phrase in the corresponding {@linkplain PhrasePosition position}. */ @Override public boolean add(Mapping m) { checkMapping(m); return mappings.add(m); } /** * Gets an iterator over the mappings in this alignment. */ @Override public Iterator iterator() { return mappings.iterator(); } /** * Gets the number of mappings in this alignment. */ @Override public int size() { return mappings.size(); } /** * Compares this alignment to another by comparing their {@linkplain #getNumber() numbers}. * @param o The alignment to compare to. * @return The value of getNumber().compareTo(o.getNumber()). * @see Integer#compareTo(Integer) */ @Override public int compareTo(Alignment o) { return getNumber().compareTo(o.getNumber()); } /** * Tests whether this alignment is equal to another by comparing their mappings and their phrases. * @see Phrase#equals(Object) */ @Override public boolean equals(Object o) { if(o instanceof Alignment) { Alignment al = (Alignment)o; return super.equals(o) && a.equals(al.a) && b.equals(al.b); } return false; } /** * Generates a hash code for this alignment based on its mappings and phrases. */ @Override public int hashCode() { return 37 * super.hashCode() + a.hashCode() + b.hashCode(); } /** * Gets a string representation of this alignment with both phrases and the mappings between them. */ @Override public String toString() { StringBuilder sb = new StringBuilder(A.name()); sb.append(": "); sb.append(a.toString()); sb.append(", "); sb.append(B.name()); sb.append(": "); sb.append(b.toString()); sb.append(", mappings: "); sb.append(super.toString()); return sb.toString(); } // Views and conveniences /** * Gets the indices mapped to from the specified source, assuming that the source is in the * {@linkplain PhrasePosition#A A-position}. * * @return the value of getTargets(source, PhrasePosition.A) * @see #getTargets(Integer, PhrasePosition) */ public Set getTargets(Integer source) { return getTargets(source, A); } /** * Gets the indices mapped to by a specified index starting from the specified position. For example, if * an alignment contains the following mappings: *

	 * 7 <-> 4
	 * 3 <-> 4
	 * 4 <-> 4
	 * ...
* Then calling getTargets(4, {@link PhrasePosition#B}) returns a set containing 7, 3, * and 4. *
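* 
* As a rough, illustrative sketch of the same example (assuming phrases p1 and p2 built
* elsewhere, with p1 at least eight words long and p2 at least five):
* 
* 	 Alignment al = new Alignment(p1, p2, Arrays.asList(
* 	     new Mapping(p1.getNumber(), 7, 4),
* 	     new Mapping(p1.getNumber(), 3, 4),
* 	     new Mapping(p1.getNumber(), 4, 4)));
* 	 Set<Integer> sources = al.getTargets(4, PhrasePosition.B);   // {7, 3, 4}
* 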

* Calling this method is equivalent to calling * {@link #asMap(PhrasePosition) asMap}(sourcePosition).get(source), with the exception that if * no mappings have source in the source position, the empty set is returned rather than * null. * * @param source The index to look for targets of. * @param sourcePosition The phrase position to assume the source index belongs to. * * @return A set of indices in the {@linkplain PhrasePosition#opposite() opposite position} that the * specified source index maps to (the same as asMap(sourcePosition).get(source)), * or the empty set if no such indices are present. * * @see #add(Mapping) * @see #asMap(PhrasePosition) */ public Set getTargets(Integer source, PhrasePosition sourcePosition) { return new LinkedHashSet(new ValueView(source, sourcePosition)); } /** * Gets the indices in a specified phrase position. Specifically, returns a set containing every * integer i such that there exists a mapping in this alignment that returns i * for the call {@link Mapping#get(PhrasePosition)} with the specified position as argument. * @param position The position to get indices for. * @return The same value as asMap(position).keySet(). * @see #asMap(PhrasePosition) */ public Set getIndices(PhrasePosition position) { return new LinkedHashSet(new KeyView(position)); } /** * Gets a map view of this alignment from the {@linkplain Alignments#DEFAULT_PHRASE_POSITION * default phrase position}. * @see #asMap(PhrasePosition) */ public Map> asMap() { return asMap(Alignments.DEFAULT_PHRASE_POSITION); } /** * Gets a map view of this alignment from the specified key position. The returned map's keys are drawn * from the mappings by accessing the specified key position, while the values are aggregated together * into sets from the indices at keyPosition's {@linkplain PhrasePosition#opposite() opposite * position}. The returned map contains key/value pairs that can be used to reconstruct the alignment * it is based on via the {@link #fromMap(Phrase, Phrase, Map)} method. That is, calling *

Alignment.fromMap(a.getA(), a.getB(), a.asMap(PhrasePosition.A))
* for any alignment a always returns an alignment that is equivalent to a according * to the {@link #equals(Object)} method. *

* For example, if this alignment contains the following mappings *

	 * 0 <-> 0
	 * 0 <-> 1
	 * 1 <-> 2
	 * 3 <-> 2
*
* then calling asMap(PhrasePosition.A) returns a map with the key/value pairings *
	 * 0=[0, 1]
	 * 1=[2]
	 * 3=[2]
*
* while calling asMap(PhrasePosition.B) gives the map view from the "opposite * direction", i.e. *
	 * 0=[0]
	 * 1=[0]
	 * 2=[1, 3]
*
* Note that the order of the keys and values reflects the ordering of the alignment's mappings via * {@link LinkedHashMap} and {@link LinkedHashSet}, and is dependent * on its {@linkplain #iterator() iterator}. Also, the behavior of * the returned map is not specified if mappings are added to or removed from this alignment after a call to * asMap(). *
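* 
* A minimal sketch of the asMap/fromMap round trip described above (illustrative only, for
* some existing alignment al):
* 
* 	 Map<Integer, Set<Integer>> view = al.asMap(PhrasePosition.A);
* 	 Alignment copy = Alignment.fromMap(al.getA(), al.getB(), view);
* 	 // copy.equals(al) holds, per the contract of fromMap and asMap
* 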

* The returned map is detached from (not backed by) this set of mappings, so keys can be removed from and * added to it without any effect on this alignment. Similarly, the sets of indices that are the values * of its entry set can be modified without affecting this alignment. The * {@link #fromMap(Phrase, Phrase, Map)} provides the ability to create an alignment based on a map of * A indices to sets of B indices. * * @param keyPosition The phrase position that the resulting maps keys should be taken from. * @return A map whose {@linkplain Map#keySet() keys} are from the phrase in the specified position, and * whose values are sets of indices from the phrase in the {@linkplain PhrasePosition#opposite() opposite} * position. * * @see #fromMap(Phrase, Phrase, Map) * @see LinkedHashMap * @see LinkedHashSet */ public Map> asMap(PhrasePosition keyPosition) { return new LinkedHashMap>(new MapView(keyPosition)); } void checkPhrases(Phrase ap, Phrase bp) { if(ap == null) { throw new IllegalArgumentException(A.name() + " phrase is null"); } if(bp == null) { throw new IllegalArgumentException(B.name() + " phrase is null"); } if(!ap.number.equals(bp.number)) { throw new IllegalArgumentException("phrases have different numbers"); } } void checkMapping(Mapping m) { if(m == null) { throw new IllegalArgumentException("attempt to add null mapping"); } if(m.phraseNumber != null && !m.phraseNumber.equals(a.number)) { throw new IllegalArgumentException("mapping's phrase number does not match: expected " + a.number + ", but was " + m.phraseNumber); } for(PhrasePosition pos : PhrasePosition.values()) { checkIndex(m.get(pos), pos); } } void checkIndex(Integer index, PhrasePosition intendedPosition) { if(index == null) { throw new IllegalArgumentException("attempt to add null index in position " + intendedPosition.name()); } if(index < -1 || get(intendedPosition).size() <= index) { throw new IndexOutOfBoundsException(intendedPosition.name() + " index out of bounds: " + index); } } class MapView extends AbstractMap> { PhrasePosition keyPosition; MapView(PhrasePosition keyPosition) { this.keyPosition = keyPosition; } @Override public Set>> entrySet() { return new AbstractSet>>() { private Set keys = new KeyView(keyPosition); @Override public int size() { return keys.size(); } @Override public Iterator>> iterator() { return new Iterator>>() { private Iterator i = keys.iterator(); @Override public boolean hasNext() { return i.hasNext(); } @Override public Entry> next() { final Integer key = i.next(); // copy values because HashMap's constructor doesn't return new SimpleImmutableEntry>( key, new LinkedHashSet(new ValueView(key, keyPosition))); } @Override public void remove() { i.remove(); // throws UnsupportedOperationException } }; } }; } } abstract class IndexView extends AbstractSet { PhrasePosition indexPosition; Filter indexFilter; private Set indices; IndexView(PhrasePosition indexPosition, Filter indexFilter) { this.indexPosition = indexPosition; this.indexFilter = indexFilter; } Set indices() { return (indices == null) ? 
(indices = new FilteredSet(Alignment.this.mappings, indexFilter)) : indices; } @Override public int size() { return indices().size(); } @Override public Iterator iterator() { return new Iterator() { private Iterator i = indices().iterator(); @Override public boolean hasNext() { return i.hasNext(); } @Override public Integer next() { return i.next().get(indexPosition); } @Override public void remove() { throw new UnsupportedOperationException(); // just in case } }; } } class KeyView extends IndexView { KeyView(final PhrasePosition keyPosition) { super(keyPosition, new DelegatedFilter(new VisitedFilter()) { @Override public Integer delegateValueFor(Mapping e) { return e.get(keyPosition); } }); } } class ValueView extends IndexView { ValueView(final Integer key, final PhrasePosition keyPosition) { super(keyPosition.opposite(), new Filter() { @Override public boolean allows(Mapping m) { return key.equals(m.get(keyPosition)); } }); } } } ================================================ FILE: src/opennlp/ccg/alignment/Alignments.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.alignment; import static opennlp.ccg.alignment.MappingFormat.Field.A_INDEX_FIELD; import static opennlp.ccg.alignment.MappingFormat.Field.B_INDEX_FIELD; import static opennlp.ccg.alignment.MappingFormat.Field.PHRASE_NUMBER_FIELD; import static opennlp.ccg.alignment.MappingFormat.Field.STATUS_FIELD; import java.io.BufferedReader; import java.io.BufferedWriter; import java.io.File; import java.io.FileReader; import java.io.FileWriter; import java.io.IOException; import java.io.Reader; import java.io.Writer; import java.util.ArrayList; import java.util.Collections; import java.util.HashSet; import java.util.LinkedHashMap; import java.util.LinkedHashSet; import java.util.List; import java.util.Map; import java.util.Set; import java.util.SortedMap; import java.util.SortedSet; import java.util.TreeMap; import java.util.TreeSet; import java.util.regex.Pattern; import opennlp.ccg.alignment.MappingFormat.Field; /** * Static non-instantiable class that provides convenience methods for reading * and writing phrases, mappings, and alignments. *

* The tokenize convenience methods split a string into an array of strings, and the * untokenize methods provide their inverses. *
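* 
* For instance (illustrative only):
* 
* 	 String[] toks = Alignments.tokenize("the cat   sleeps");   // ["the", "cat", "sleeps"]
* 	 String sent = Alignments.untokenize(toks);                 // "the cat sleeps"
* 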

* The readXxxPhrases() methods all call {@link #readPhrases(PhraseReader)} to read * {@linkplain Phrase phrases} from an underlying reader. Depending on the method, phrases are assumed to be * identified or to merely occur in sequence. Similarly, the writeXxxPhrases() methods all call * {@link #writePhrases(List, PhraseWriter)}. *

* {@linkplain Mapping Mappings} can be read using readMappings(...) methods, which will read * mappings as formatted by the specified * format. The readSortedMappings(...) methods are variants of these that return a map with * sorted keys that map to {@linkplain SortedSet sorted sets} of mappings. * The methods {@link #writeMappings(Map, File, MappingFormat)} and * {@link #writeMappings(Map, Writer, MappingFormat)} perform the inverse of the methods for reading. *
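* 
* A sketch of reading and re-writing mappings (illustrative only; the file names are invented
* and fmt stands for a suitable MappingFormat obtained elsewhere):
* 
* 	 Map<Integer, Set<Mapping>> byPhrase = Alignments.readMappings(new File("gold.align"), fmt);
* 	 Alignments.writeMappings(byPhrase, new File("copy.align"), fmt);
* 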

* Finally, the readXxxAlignments() methods combine the methods for reading phrases and mappings to * allow {@linkplain Alignments alignments} to be read. The methods * {@link #writeAlignments(List, File, File, File, String, MappingFormat)} and * {@link #writeAlignments(List, Writer, Writer, Writer, String, MappingFormat)} write alignments according to * a specified word separator and mapping format. * * @see PhraseReader * @see PhraseWriter * @see IdentifiedPhraseReader * @see IdentifiedPhraseWriter * @see MappingReader * @see MappingWriter * @see MappingFormat * @author Scott Martin */ public final class Alignments { /** * The default status: {@link Status#SURE}. */ public static final Status DEFAULT_STATUS = Status.SURE; /** * The default mapping confidence: 1.0. */ public static final Double DEFAULT_CONFIDENCE = Double.valueOf(1.0d); /** * The default phrase numbering base: {@link IndexBase#ZERO}. */ public static final IndexBase DEFAULT_PHRASE_NUMBER_BASE = IndexBase.ZERO; /** * The default index base: {@link IndexBase#ZERO}. */ public static final IndexBase DEFAULT_INDEX_BASE = IndexBase.ZERO; /** * The default phrase position: {@link PhrasePosition#A}. */ public static final PhrasePosition DEFAULT_PHRASE_POSITION = PhrasePosition.A; /** * The default word delimiter pattern, which matches multiple whitespace characters. */ public static final Pattern DEFAULT_WORD_DELIMITER = Pattern.compile("\\s+"); /** * The default word separator, a single space. */ public static final String DEFAULT_WORD_SEPARATOR = " "; /** * The default phrase identifier attribute name, "snum". */ public static final String DEFAULT_PHRASE_IDENTIFIER_ATTRIBUTE = "snum"; /** * The default phrase tag, "s". */ public static final String DEFAULT_PHRASE_TAG = "s"; /** * The Moses encoding scheme. */ public static final EncodingScheme MOSES_ENCODING_SCHEME; /** * The NAACL encoding scheme. */ public static final EncodingScheme NAACL_ENCODING_SCHEME; /** * The default fields for the Moses format. */ public static final Set MOSES_DEFAULT_FIELDS; /** * The default fields for the NAACL format. */ public static final Set NAACL_DEFAULT_FIELDS; /** * The fields used in the abbreviated Moses format: {@link Field#A_INDEX_FIELD}, * {@link Field#B_INDEX_FIELD}. */ public static final Set MOSES_SHORT_FIELDS; /** * The fields used in the abbreviated NAACL format: {@link Field#PHRASE_NUMBER_FIELD}, * {@link Field#A_INDEX_FIELD}, {@link Field#B_INDEX_FIELD}, {@link Field#STATUS_FIELD}. */ public static final Set NAACL_SHORT_FIELDS; /** * The fields used in the extremely abbreviated NAACL format: {@link Field#PHRASE_NUMBER_FIELD}, * {@link Field#A_INDEX_FIELD}, {@link Field#B_INDEX_FIELD}. */ public static final Set NAACL_VERY_SHORT_FIELDS; /** * The default {@linkplain MappingFormat#isStrict() mapping format strictness}: false. */ public static final boolean DEFAULT_STRICTNESS = false; /** * The default {@linkplain IdentifiedPhraseWriter#isPadding() identified phrase writer padding}: * false. 
*/ public static final boolean DEFAULT_PHRASE_PADDING = false; static { Set msf = new HashSet(), nsf = new HashSet(), nvsf = new HashSet(); msf.add(A_INDEX_FIELD); msf.add(B_INDEX_FIELD); nsf.add(PHRASE_NUMBER_FIELD); nsf.add(A_INDEX_FIELD); nsf.add(B_INDEX_FIELD); nsf.add(STATUS_FIELD); nvsf.add(PHRASE_NUMBER_FIELD); nvsf.add(A_INDEX_FIELD); nvsf.add(B_INDEX_FIELD); MOSES_SHORT_FIELDS = Collections.unmodifiableSet(msf); NAACL_SHORT_FIELDS = Collections.unmodifiableSet(nsf); NAACL_VERY_SHORT_FIELDS = Collections.unmodifiableSet(nvsf); MOSES_DEFAULT_FIELDS = MOSES_SHORT_FIELDS; NAACL_DEFAULT_FIELDS = NAACL_SHORT_FIELDS; // these have to come last, they depend on some of the others MOSES_ENCODING_SCHEME = new MosesEncodingScheme(); NAACL_ENCODING_SCHEME = new NAACLEncodingScheme(); } private Alignments() { // this class should not be instantiated } /** * Tokenizes a string according to the {@linkplain #DEFAULT_WORD_DELIMITER default word delimiter}. */ public static String[] tokenize(String s) { return tokenize(s, DEFAULT_WORD_DELIMITER); } /** * Tokenizes a string according to the specified word * delimiter pattern. */ public static String[] tokenize(String s, Pattern wordDelimiter) { return wordDelimiter.split(s); } /** * Untokenizes a list of tokens into a single string, with former tokens separated by the * {@linkplain #DEFAULT_WORD_SEPARATOR}. * * @see #untokenize(List, String) */ public static String untokenize(List tokens) { return untokenize(tokens, DEFAULT_WORD_SEPARATOR); } /** * Untokenizes a list of tokens into a single string, with former tokens separated by the * specified delimiter string. */ public static String untokenize(List tokens, String delimiter) { return untokenize(tokens.toArray(new String[tokens.size()]), delimiter); } /** * Untokenizes an array of tokens into a single string using the * {@linkplain #DEFAULT_WORD_SEPARATOR default word separator}. * @param tokens The tokens to untokenize. * @return An untokenized string from the given tokens, with individual * tokens separated by the default word separator. */ public static String untokenize(String[] tokens) { return untokenize(tokens, DEFAULT_WORD_SEPARATOR); } /** * Untokenizes an array of tokens into a single string, with former tokens separated by the * specified delimiter string. */ public static String untokenize(String[] tokens, String delimiter) { StringBuilder sb = new StringBuilder(); for(String w : tokens) { if(sb.length() > 0) { sb.append(delimiter); } sb.append(w.toString()); } return sb.toString(); } /** * Reads phrases sequentially from the specified file. * @see #readPhrases(Reader) */ public static List readPhrases(File f) throws IOException { return readPhrases(new BufferedReader(new FileReader(f))); } /** * Reads phrases sequentially from the specified reader. * @see #readPhrases(Reader, IndexBase) */ public static List readPhrases(Reader r) throws IOException { return readPhrases(r, DEFAULT_PHRASE_NUMBER_BASE); } /** * Reads phrases from the specified reader. Phrases will have their line numbers translated into the * specified index base. * * @see #readPhrases(PhraseReader) */ public static List readPhrases(Reader r, IndexBase phraseNumberBase) throws IOException { PhraseReader reader = new PhraseReader(r, phraseNumberBase); try { return readPhrases(reader); } finally { reader.close(); } } /** * Reads phrases from the specified file.
* * @see #readIdentifiedPhrases(Reader) */ public static List readIdentifiedPhrases(File f) throws IOException { return readIdentifiedPhrases(new BufferedReader(new FileReader(f))); } /** * Reads phrases from the specified reader, using the default * {@linkplain #DEFAULT_PHRASE_NUMBER_BASE phrase number base}, * {@linkplain #DEFAULT_PHRASE_TAG phrase tag}, and * {@linkplain #DEFAULT_PHRASE_IDENTIFIER_ATTRIBUTE phrase identifier attribute}. * * @see #readIdentifiedPhrases(Reader, IndexBase, String, String) */ public static List readIdentifiedPhrases(Reader r) throws IOException { return readIdentifiedPhrases(r, DEFAULT_PHRASE_NUMBER_BASE, DEFAULT_PHRASE_TAG, DEFAULT_PHRASE_IDENTIFIER_ATTRIBUTE); } /** * Reads phrases from the specified reader. The input is assumed to have markup accompanying the phrase data * that indicates the {@linkplain Phrase#getId() phrase ID} for each phrase. * * @param r The underlying reader. * @param phraseNumberBase The index base to translate line numbers into. * @param phraseTag The tag name for markup signaling a phrase. * @param phraseIdentifierAttribute The name of the attribute that contains the phrase's ID in the markup. * * @see #readPhrases(PhraseReader) */ public static List readIdentifiedPhrases(Reader r, IndexBase phraseNumberBase, String phraseTag, String phraseIdentifierAttribute) throws IOException { PhraseReader reader = new IdentifiedPhraseReader(r, phraseNumberBase, phraseTag, phraseIdentifierAttribute); try { return readPhrases(reader); } finally { reader.close(); } } /** * Reads phrases sequentially from the specified phrase reader. * * @return A list of phrases in the order they are encountered by calling {@link PhraseReader#readPhrase()} * on the specified reader. * @throws IOException if one is thrown by the specified phrase reader. * @see PhraseReader */ public static List readPhrases(PhraseReader reader) throws IOException { List l = new ArrayList(); Phrase p; while((p = reader.readPhrase()) != null) { l.add(p); } return l; } /** * Writes a list of phrases with IDs to the specified file. * * @see #writeIdentifiedPhrases(List, Writer) */ public static void writeIdentifiedPhrases(List phrases, File f) throws IOException { writeIdentifiedPhrases(phrases, new BufferedWriter(new FileWriter(f))); } /** * Writes a list of phrases with IDs to the specified writer, using the default * {@linkplain #DEFAULT_WORD_SEPARATOR word separator}, * {@linkplain #DEFAULT_PHRASE_TAG phrase tag}, * {@linkplain #DEFAULT_PHRASE_IDENTIFIER_ATTRIBUTE phrase identifier attribute}, and * {@linkplain #DEFAULT_PHRASE_PADDING padding flag}. * * @see #writeIdentifiedPhrases(List, Writer, String, String, String, boolean) */ public static void writeIdentifiedPhrases(List phrases, Writer w) throws IOException { writeIdentifiedPhrases(phrases, w, DEFAULT_WORD_SEPARATOR, DEFAULT_PHRASE_TAG, DEFAULT_PHRASE_IDENTIFIER_ATTRIBUTE, DEFAULT_PHRASE_PADDING); } /** * Writes a list of phrases to the specified writer. * * @param phrases The phrases to write. * @param w The underlying writer. * @param wordSeparator The string to use to {@linkplain #untokenize(String[], String) untokenize} with. * @param phraseTag The name of the tag used to signal a phrase in the output markup. * @param phraseIdentifierAttribute The name of the attribute bearing the phrase's ID in the output markup. * @param padding Whether or not to include padding between the markup and the phrase data. 
* * @see #writePhrases(List, PhraseWriter) */ public static void writeIdentifiedPhrases(List phrases, Writer w, String wordSeparator, String phraseTag, String phraseIdentifierAttribute, boolean padding) throws IOException { PhraseWriter pw = new IdentifiedPhraseWriter(w, wordSeparator, phraseTag, phraseIdentifierAttribute, padding); try { writePhrases(phrases, pw); } finally { pw.close(); } } /** * Writes a list of phrases to the specified file. * * @see #writePhrases(List, Writer) */ public static void writePhrases(List phrases, File f) throws IOException { writePhrases(phrases, new BufferedWriter(new FileWriter(f))); } /** * Writes a list of phrases to the specified writer using the * {@linkplain #DEFAULT_WORD_SEPARATOR default word separator}. * * @see #writePhrases(List, Writer, String) */ public static void writePhrases(List phrases, Writer w) throws IOException { writePhrases(phrases, w, DEFAULT_WORD_SEPARATOR); } /** * Writes a list of phrases to the specified writer using the specified word separator. * * @see #writePhrases(List, PhraseWriter) */ public static void writePhrases(List phrases, Writer w, String wordSeparator) throws IOException { PhraseWriter pw = new PhraseWriter(w, wordSeparator); try { writePhrases(phrases, pw); } finally { pw.close(); } } /** * Writes a list of phrases to the specified phrase writer. * * @param phrases The phrases to write. * @param writer The underlying phrase writer. * @throws IOException if a call to {@link PhraseWriter#writePhrase(Phrase)} throws one for one of the * phrases. */ public static void writePhrases(List phrases, PhraseWriter writer) throws IOException { for(Phrase p : phrases) { writer.writePhrase(p); } } /** * Reads mappings from the specified file using the specified format. * * @see #readMappings(Reader, MappingFormat) */ public static Map> readMappings(File f, MappingFormat format) throws IOException { return readMappings(new BufferedReader(new FileReader(f)), format); } /** * Reads mappings from the specified reader using the specified format. * * @see #readMappings(MappingReader) */ public static Map> readMappings(Reader r, MappingFormat format) throws IOException { MappingReader mr = new MappingReader(r, format); try { return readMappings(mr); } finally { mr.close(); } } /** * Reads mappings from the specified mapping reader. Once all available mappings have been read, the * specified reader is {@linkplain MappingReader#close() closed}. * * @param reader The mapping reader to read mappings from. * @return A map whose keys are the {@linkplain Phrase#getNumber() phrase numbers} of the corresponding * phrases and whose values are sets containing the mappings for the key phrase. Both the keys and the * sets of mappings are maintained in the order in which they occur in the input. * * @throws IOException if the underlying reader throws an exception, or if one of the * {@linkplain MappingGroup mapping groups} contains a duplicate mapping. 
* * @see MappingReader */ public static Map> readMappings(MappingReader reader) throws IOException { Map> am = new LinkedHashMap>(); try { MappingGroup ag = null; while((ag = reader.nextGroup()) != null) { Set as = am.get(ag.phraseNumber); if(as == null) { as = new LinkedHashSet(); am.put(ag.phraseNumber, as); } while(reader.canRead()) { Mapping m = reader.readMapping(); if(!as.add(m)) { throw new IOException("duplicate mapping in group " + ag + ": " + m); } } } } finally { reader.close(); } return am; } /** * Reads mappings into a sorted map from the specified file, based on the specified format. * * @see #readSortedMappings(Reader, MappingFormat) */ public static SortedMap> readSortedMappings(File f, MappingFormat format) throws IOException { return readSortedMappings(new BufferedReader(new FileReader(f)), format); } /** * Reads mappings into a sorted map from the specified reader, using the specified format to parse * mappings. * * @see #readSortedMappings(MappingReader) */ public static SortedMap> readSortedMappings(Reader r, MappingFormat format) throws IOException { MappingReader mr = new MappingReader(r, format); try { return readSortedMappings(mr); } finally { mr.close(); } } /** * Reads mappings into a sorted map from the specified reader, using the specified format to parse * mappings. * * @param mr The mapping reader to use. * @return A sorted map whose keys and values are also sorted according to their natural order. * * @throws IOException if the underlying reader throws an exception. * * @see Mapping#compareTo(Mapping) */ public static SortedMap> readSortedMappings(MappingReader mr) throws IOException { SortedMap> sm = new TreeMap>(); Map> m = readMappings(mr); for(Integer k : m.keySet()) { sm.put(k, new TreeSet(m.get(k))); } return sm; } /** * Writes the specified map to the specified file using the format provided. * * @see #writeMappings(Map, Writer, MappingFormat) */ public static void writeMappings(Map> map, File f, MappingFormat format) throws IOException { writeMappings(map, new BufferedWriter(new FileWriter(f)), format); } /** * Writes the specified map to the specified writer using the format provided. * * @see #writeMappings(Map, MappingWriter) */ public static void writeMappings(Map> map, Writer w, MappingFormat format) throws IOException { writeMappings(map, new MappingWriter(w, format)); } /** * Writes the specified map to the specified writer, starting {@linkplain MappingGroup mapping groups} * as needed based on the key and the {@linkplain Set#size() size} of the value set. After all the sets * of mappings in the map have been written, {@link MappingWriter#close()} is called. * * @param map The mappings to write. * @param writer The underlying writer to write to. * @see MappingGroup * @throws IOException if one occurs in the underlying writer. */ public static void writeMappings(Map> map, MappingWriter writer) throws IOException { try { for(Integer k : map.keySet()) { Set as = map.get(k); writer.startGroup(new MappingGroup(k, as.size())); for(Mapping a : as) { writer.writeMapping(a); } } } finally { writer.close(); } } /** * Reads alignments from the specified files, using the provided mapping format. 
* * @see #readAlignments(Reader, Reader, Reader, MappingFormat) */ public static List readAlignments(File phraseA, File phraseB, File mappings, Pattern wordDelimiter, MappingFormat format) throws IOException { return readAlignments(new BufferedReader(new FileReader(phraseA)), new BufferedReader(new FileReader(phraseB)), new BufferedReader(new FileReader(mappings)), format); } /** * Reads alignments from the specified readers, using the provided mapping format. * * @see #readAlignments(PhraseReader, PhraseReader, Reader, MappingFormat) */ public static List readAlignments(Reader phraseA, Reader phraseB, Reader mappings, MappingFormat format) throws IOException { IndexBase idBase = format.encodingScheme.getPhraseNumberBase(); return readAlignments(new PhraseReader(phraseA, idBase), new PhraseReader(phraseB, idBase), mappings, format); } /** * Reads alignments from the specified files, using the provided word delimiter pattern and mapping format. * The files containing phrases are assumed to contain markup indicating the phrase IDs. * * @see #readIdentifiedAlignments(Reader, Reader, Reader, MappingFormat) */ public static List readIdentifiedAlignments(File phraseA, File phraseB, File mappings, Pattern wordDelimiter, MappingFormat format) throws IOException { return readIdentifiedAlignments(new BufferedReader(new FileReader(phraseA)), new BufferedReader(new FileReader(phraseB)), new BufferedReader(new FileReader(mappings)), format); } /** * Reads alignments from the specified readers, using the provided word delimiter pattern and mapping format. * The readers for phrases are assumed to have input with markup indicating the phrase IDs. * * @see #readAlignments(PhraseReader, PhraseReader, Reader, MappingFormat) */ public static List readIdentifiedAlignments(Reader phraseA, Reader phraseB, Reader mappings, MappingFormat format) throws IOException { return readAlignments(new IdentifiedPhraseReader(phraseA), new IdentifiedPhraseReader(phraseB), mappings, format); } /** * Reads alignments from the specified readers, using the provided format to parse mappings. The * line numbers of the phrases are translated into the * {@linkplain EncodingScheme#getPhraseNumberBase() phrase number base} of the * {@linkplain MappingFormat#getEncodingScheme() format's encoding scheme}. * * @param phraseA The reader from which the {@linkplain PhrasePosition#A A-position} phrases are read. * @param phraseB The reader from which the {@linkplain PhrasePosition#B B-position} phrases are read. * @param mappings The reader whose input contains the mappings from A-phrases to B-phrases, where the * A-position indices are assumed to correspond to the phrases in phraseA and the B-position * indices are assumed to correspond to the phrases in phraseB. * @param format The mapping format used to parse mappings read from mapping. * @return A list of alignments where the {@linkplain Alignment#getA() A-phrases} are from phraseA, * the {@linkplain Alignment#getB() B-phrases} are from phraseB, and the mappings are the ones * read from mappings with the corresponding {@linkplain Phrase#getNumber() phrase number}. * @throws IOException if phraseA has a different number of phrases than phraseB, or if * one is thrown by any of the underlying readers. 
* * @see PhraseReader * @see MappingReader * @see #readPhrases(PhraseReader) * @see #readMappings(MappingReader) */ public static List readAlignments(PhraseReader phraseA, PhraseReader phraseB, Reader mappings, MappingFormat format) throws IOException { List m = new ArrayList(); try { List ps1 = readPhrases(phraseA), ps2 = readPhrases(phraseB); Map> mm = readMappings(mappings, format); // sanity check if(ps1.size() != ps2.size()) { throw new IOException("number of phrases different between first and second"); } for(int i = 0; i < ps1.size(); i++) { m.add(new Alignment(ps1.get(i), ps2.get(i), mm.get(i))); } } finally { phraseA.close(); phraseA.close(); mappings.close(); } return m; } /** * Writes a list of alignments to the specified files, using the word separator and format provided. * * @see #writeAlignments(List, Writer, Writer, Writer, String, MappingFormat) */ public static void writeAlignments(List alignments, File phraseA, File phraseB, File mappings, String wordSeparator, MappingFormat format) throws IOException { writeAlignments(alignments, new BufferedWriter(new FileWriter(phraseA)), new BufferedWriter(new FileWriter(phraseB)), new BufferedWriter(new FileWriter(mappings)), wordSeparator, format); } /** * Writes a list of alignments to the specified readers, using the word separator and format provided. * After all the alignments are written, all the associated writers are closed. * * @param alignments The alignments to write. * @param phraseA The writer to which {@linkplain Alignment#getA() A-position phrases} are written. * @param phraseB The writer to which {@linkplain Alignment#getB() B-position phrases} are written. * @param mappings The mappings to write, where the {@linkplain Mapping#getA() A-position indices} are * assumed to correspond to the phrases in phraseA and the * {@linkplain Mapping#getB() B-position indices} are assumed to correspond to the ones in phraseB. * @param wordSeparator The word separator to use for * {@linkplain #untokenize(List, String) untokenization}. * @param format The format to use for formatting mappings in the alignments. * @throws IOException if one is thrown by any of the underlying writers. */ public static void writeAlignments(List alignments, Writer phraseA, Writer phraseB, Writer mappings, String wordSeparator, MappingFormat format) throws IOException { PhraseWriter pw1 = new PhraseWriter(phraseA, wordSeparator), pw2 = new PhraseWriter(phraseB, wordSeparator); MappingWriter mw = new MappingWriter(mappings, format); try { for(int i = 0; i < alignments.size(); i++) { Alignment a = alignments.get(i); pw1.writePhrase(a.a); pw2.writePhrase(a.b); mw.startGroup(new MappingGroup(i, a.size())); for(Mapping m : a) { mw.writeMapping(m); } } } finally { pw1.close(); pw2.close(); mw.close(); } } } ================================================ FILE: src/opennlp/ccg/alignment/EncodingScheme.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. 
See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.alignment; import java.util.List; import java.util.Set; /** * An encoding scheme for mappings. Some examples are * the {@linkplain MosesEncodingScheme Moses scheme} and the {@linkplain NAACLEncodingScheme NAACL scheme}. *

* Implementers keep track of the {@link IndexBase}s an encoding scheme uses (for both phrase * numbers and indices) and the characters it uses to delimit mappings, groups of mappings, and fields within * mappings. An encoding scheme also captures which fields occur * in which {@linkplain #getOrder() order}, along with which ones are * {@linkplain #getRequired() required}, and which are used by {@linkplain #getDefaults() default}. *
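* 
* For example (illustrative only), the predefined Moses scheme can be inspected like this:
* 
* 	 EncodingScheme scheme = Alignments.MOSES_ENCODING_SCHEME;
* 	 List<MappingFormat.Field> order = scheme.getOrder();
* 	 Set<MappingFormat.Field> required = scheme.getRequired();
* 	 IndexBase indexBase = scheme.getIndexBase();
* 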

* Some convenience methods are provided for determining whether a given * character is the field, mapping, or group delimiter for this encoding scheme. These methods mainly allow * comparison when one character is a line separator that may be different from the one on the current platform. *
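* 
* For instance (illustrative only), given any scheme whose mapping delimiter is a line
* separator, both of these calls return true regardless of the platform's own line separator:
* 
* 	 scheme.isMappingDelimiter('\n');
* 	 scheme.isMappingDelimiter('\r');
* 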

* Encoding schemes are used in the {@link MappingFormat} class, as well as in * the readers and writers for {@link Mapping}s and {@link Alignment}s. * * @author Scott Martin * @see AbstractEncodingScheme * @see MappingFormat * @see Moses alignment format * @see NAACL shared task alignment format */ public interface EncodingScheme { /** * Tests whether the supplied character counts as a field delimiter according to this encoding scheme. * @return true if c is equal to {@link #getFieldDelimiter()} or both c and * field delimiters are line separators. */ public boolean isFieldDelimiter(Character c); /** * Tests whether the supplied character counts as a mapping delimiter according to this encoding scheme. * @return true if c is equal to {@link #getMappingDelimiter()} or both c and * mapping delimiters are line separators. */ public boolean isMappingDelimiter(Character c); /** * Tests whether the supplied character counts as a group delimiter according to this encoding scheme. * @return true if c is equal to {@link #getGroupDelimiter()} or both c and * group delimiters are line separators. */ public boolean isGroupDelimiter(Character c); /** * Gets the delimiter for fields. */ public Character getFieldDelimiter(); /** * Gets the delimiter for mappings. */ public Character getMappingDelimiter(); /** * Gets the delimiter for groups. */ public Character getGroupDelimiter(); /** * Gets the numbering base used for phrases. */ public IndexBase getPhraseNumberBase(); /** * Gets the numbering base used for mapping indices. */ public IndexBase getIndexBase(); /** * Gets the order in which fields occur in this encoding scheme. */ public List getOrder(); /** * Gets the required (non-optional) fields in this scheme. */ public Set getRequired(); /** * Gets the default fields in this scheme. */ public Set getDefaults(); } ================================================ FILE: src/opennlp/ccg/alignment/IdentifiedPhraseReader.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.alignment; import static opennlp.ccg.alignment.Alignments.DEFAULT_PHRASE_IDENTIFIER_ATTRIBUTE; import static opennlp.ccg.alignment.Alignments.DEFAULT_PHRASE_NUMBER_BASE; import static opennlp.ccg.alignment.Alignments.DEFAULT_PHRASE_TAG; import static opennlp.ccg.alignment.Alignments.DEFAULT_WORD_DELIMITER; import java.io.IOException; import java.io.Reader; import java.util.ArrayList; import java.util.List; /** * Phrase reader for phrases that have an identifier in addition to a line number, usually formatted by * markup like *

 * <s snum="157"> ... </s>
 * 
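* 
* A minimal reading sketch (illustrative only; the input string is invented):
* 
* 	 IdentifiedPhraseReader reader = new IdentifiedPhraseReader(
* 	     new StringReader("<s snum=\"157\"> the cat sleeps </s>"));
* 	 Phrase p = reader.readPhrase();   // p.getId() yields "157"
* 	 reader.close();
* 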
* Since the value of the identifier is not necessarily an {@link Integer}, this class gives IDs as strings. * The {@linkplain #getPhraseIdentifierAttribute() phrase identifier attribute} (here snum) and * {@linkplain #getPhraseTag() phrase tag} (here s) are configurable when instances are * constructed. * * @author Scott Martin * @see Alignments#DEFAULT_PHRASE_TAG * @see Alignments#DEFAULT_PHRASE_IDENTIFIER_ATTRIBUTE */ public class IdentifiedPhraseReader extends PhraseReader { static final String TAG_START = "<", TAG_END = ">"; final String phraseTag, phraseIdentifierAttribute; private String lastId = null; /** * Creates an identified phrase reader with the {@linkplain Alignments#DEFAULT_PHRASE_NUMBER_BASE default * number base}. * * @see #IdentifiedPhraseReader(Reader, IndexBase) * @see Alignments#DEFAULT_PHRASE_TAG * @see Alignments#DEFAULT_PHRASE_IDENTIFIER_ATTRIBUTE */ public IdentifiedPhraseReader(Reader in) { this(in, DEFAULT_PHRASE_NUMBER_BASE); } /** * Creates an identified phrase reader with the {@linkplain Alignments#DEFAULT_PHRASE_TAG default phrase tag} * and {@link Alignments#DEFAULT_PHRASE_IDENTIFIER_ATTRIBUTE default phrase identifier attribute}. * * @see #IdentifiedPhraseReader(Reader, IndexBase, String, String) * @see Alignments#DEFAULT_PHRASE_TAG * @see Alignments#DEFAULT_PHRASE_IDENTIFIER_ATTRIBUTE */ public IdentifiedPhraseReader(Reader in, IndexBase numberBase) { this(in, numberBase, DEFAULT_PHRASE_TAG, DEFAULT_PHRASE_IDENTIFIER_ATTRIBUTE); } /** * Creates an identified phrase reader for the specified phrase tag and identifier attribute. * @param phraseTag The phrase tag that will be used to parse identifiers. * @param phraseIdentifierAttribute The attribute that will denote identifiers when parsing phrases. * @throws IllegalArgumentException if phraseIdentifierAttribute or phraseTag * is null. */ public IdentifiedPhraseReader(Reader in, IndexBase numberBase, String phraseTag, String phraseIdentifierAttribute) { super(in, numberBase); if(phraseIdentifierAttribute == null) { throw new IllegalArgumentException("phraseIdentifierAttribute is null"); } if(phraseTag == null) { throw new IllegalArgumentException("phraseTag is null"); } this.phraseIdentifierAttribute = phraseIdentifierAttribute; this.phraseTag = phraseTag; } /** * Gets the last ID encountered. */ public String getLastId() { return lastId; } /** * Gets the tag that denotes a phrase. */ public String getPhraseTag() { return phraseTag; } /** * Gets the attribute name that denotes a phrase identifier. */ public String getPhraseIdentifierAttribute() { return phraseIdentifierAttribute; } /** * Reads a phrase from the underlying input stream, first parsing the {@linkplain Phrase#getNumber() * phrase's number} based on the {@linkplain #getPhraseTag() phrase tag} and * {@linkplain #getPhraseIdentifierAttribute() identifier attribute} being used. * @return A phrase with the ID signaled in the input. * @throws IOException If the underlying input contains ill-formated phrase markup, or if no ID cannot be * determined after parsing the phrase markup. */ @Override public Phrase readPhrase() throws IOException { String ln = readLine(); if(ln == null) { return null; } String[] chunks = DEFAULT_WORD_DELIMITER.split(ln); String c = chunks[0]; if(!c.trim().startsWith(TAG_START)) { throw new IOException("unable to parse: " + ln + "; expected <, but was " + c.trim()); } int clen = c.length(); int pos = (clen > 1) ? 1 : 2; String t = (pos == 1) ? 
c.substring(1).trim() : chunks[1]; if(!t.equals(phraseTag)) { throw new IOException("expected sequence tag " + phraseTag + ", but was " + t); } boolean foundIndex = false; int start = -1; for(int i = pos; i < chunks.length; i++) { if(!foundIndex) { String[] subchunks = chunks[i].trim().split("="); if(subchunks.length > 1) { if(subchunks[0].equals(phraseIdentifierAttribute)) { char[] idVal = subchunks[1].toCharArray(); int idStart = 0, idEnd = idVal.length - 1; boolean foundStart = false; for(int j = 0; j < idVal.length; j++) { if(idVal[j] == '\'' || idVal[j] == '\"') { if(foundStart) { idEnd = j; break; } else { foundStart = true; idStart = j + 1; } } } lastId = new String(idVal).substring(idStart, idEnd); foundIndex = true; } } } if(chunks[i].contains(TAG_END)) { start = i; break; } } if(!foundIndex) { throw new IOException("no ID found on line " + getLineNumber()); } List l = new ArrayList(chunks.length); for(int j = start; j < chunks.length; j++) { String cj = chunks[j]; if(j == start) { int te = cj.indexOf(TAG_END); if(te != -1) { cj = cj.substring(te + 1); } } if(j + 1 == chunks.length) { int ts = cj.indexOf(TAG_START); if(ts != -1) { cj = cj.substring(0, ts); } } if(cj.length() > 0) { l.add(cj); } } return new Phrase(lastId, getPhraseNumber(), l); } } ================================================ FILE: src/opennlp/ccg/alignment/IdentifiedPhraseWriter.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.alignment; import java.io.IOException; import java.io.Writer; import static opennlp.ccg.alignment.Alignments.*; /** * A writer for phrases with {@linkplain Phrase#getId() ids} in addition to * {@linkplain Phrase#getNumber() numbers}. Identified phrases are ones read from * markup that signals an ID for each phrase. *

* In addition to allowing the phrase tag and identifier attribute to be configured, this class can optionally * output {@linkplain #isPadding() padding} of a single space between the markup and the phrase. * * @author Scott Martin * @see IdentifiedPhraseReader */ public class IdentifiedPhraseWriter extends PhraseWriter { final String phraseTag, phraseIdentifierAttribute; final boolean padding; /** * Creates a new identified phrase writer. The word separator used is * {@link Alignments#DEFAULT_WORD_SEPARATOR}. * @see #IdentifiedPhraseWriter(Writer, String) */ public IdentifiedPhraseWriter(Writer out) { this(out, Alignments.DEFAULT_WORD_SEPARATOR); } /** * Creates a new identified phrase writer with the given word separator. The phrase tag used is the default, * {@link Alignments#DEFAULT_PHRASE_TAG}, as is the phrase ID attribute * ({@link Alignments#DEFAULT_PHRASE_IDENTIFIER_ATTRIBUTE}). * @see #IdentifiedPhraseWriter(Writer, String, String, String) */ public IdentifiedPhraseWriter(Writer out, String wordSeparator) { this(out, wordSeparator, DEFAULT_PHRASE_TAG, DEFAULT_PHRASE_IDENTIFIER_ATTRIBUTE); } /** * Creates a new identified phrase writer with the given word separator. The phrase tag used is the default, * {@link Alignments#DEFAULT_PHRASE_TAG}, as is the phrase ID attribute * ({@link Alignments#DEFAULT_PHRASE_IDENTIFIER_ATTRIBUTE}). * @see #IdentifiedPhraseWriter(Writer, String, String, String, boolean) */ public IdentifiedPhraseWriter(Writer out, String wordSeparator, String phraseTag, String phraseIdentifierAttribute) { this(out, wordSeparator, phraseTag, phraseIdentifierAttribute, DEFAULT_PHRASE_PADDING); } /** * Creates a new identified phrase writer for writing phrases to the underlying writer. * @param phraseTag The name of the tag that holds the phrase identifier. * @param phraseIdentifierAttribute The phrase identifier attribute. * @param padding Whether this writer should write a space between the pre-markup and the phrase, and * between the phrase and the post-markup. * @throws IllegalArgumentException if phraseTag or phraseIdentifierAttribute * is null. */ public IdentifiedPhraseWriter(Writer out, String wordSeparator, String phraseTag, String phraseIdentifierAttribute, boolean padding) { super(out, wordSeparator); if(phraseTag == null) { throw new IllegalArgumentException("phraseTag is null"); } if(phraseIdentifierAttribute == null) { throw new IllegalArgumentException("phraseIdentifierAttribute is null"); } this.phraseTag = phraseTag; this.phraseIdentifierAttribute = phraseIdentifierAttribute; this.padding = padding; } /** * Gets the phrase tag this writer generates with each phrase. */ public String getPhraseTag() { return phraseTag; } /** * Gets the phrase identifier attribute used to signal the phrase ID for each phrase. */ public String getPhraseIdentifierAttribute() { return phraseIdentifierAttribute; } /** * Tests whether this writer writes space padding between its pre- and post-markup and the phrase itself. * @return true if this writer uses padding. */ public boolean isPadding() { return padding; } /** * Writes the start markup indicating a phrase's ID. The tag and ID attribute are the ones used to * create this writer. * * @see #getPhraseTag() * @see #getPhraseIdentifierAttribute() * @throws IOException If a problem occurs in the underlying writer. 
*/ @Override public void preWritePhrase(Phrase phrase) throws IOException { String id = phrase.getId(); if(id == null) { throw new IOException("attempt to write phrase with null ID: " + phrase); } printWriter.print('<'); printWriter.print(phraseTag); printWriter.print(' '); printWriter.print(phraseIdentifierAttribute); printWriter.print("=\""); printWriter.print(id); printWriter.print("\">"); if(padding) { printWriter.print(' '); } } /** * Writes the end markup signaling the end of a phrase, plus a line separator. * * @throws IOException If a problem occurs in the underlying writer. */ @Override public void postWritePhrase(Phrase phrase) throws IOException { if(padding) { printWriter.print(' '); } printWriter.print(""); } } ================================================ FILE: src/opennlp/ccg/alignment/IndexBase.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.alignment; /** * A set of {@link Enum} constants representing the two common indexing bases used in representing alignments. * The constants are ordered so that their {@link Enum#ordinal()} method returns a number corresponding to * their {@linkplain #getStart() start index}. *
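 * For instance (an illustrative sketch):
 * 
 * IndexBase.ONE.getStart();                      // 1
 * IndexBase.ONE.getNullValue();                  // 0
 * IndexBase.ZERO.translate(2, IndexBase.ONE);    // 3
 * 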

* An index base is characterized by its {@linkplain IndexBase#getStart() starting point} and its * {@linkplain #getNullValue() null value}, which is derived from its starting point by decrementing by one. * One index base can translate an integer in that base into another base via the * {@link #translate(Integer, IndexBase)} method. * * @author Scott Martin * @see EncodingScheme */ public enum IndexBase { /** * The index base that starts with 0. */ ZERO, /** * The index base starting with 1. */ ONE; final Integer start, nullValue; private IndexBase() { this.start = Integer.valueOf(ordinal()); this.nullValue = start - 1; } /** * Gets the starting point of this index base. */ public Integer getStart() { return start; } /** * This index base's special null value, the value of {@link #getStart()} - 1. */ public Integer getNullValue() { return nullValue; } /** * Tests whether the specified index is valid in this index base. * @param index The index to test. * @return true If index is non-null and not less than {@link #getNullValue()}. */ public boolean isValidIndex(Integer index) { return index != null && nullValue <= index; } /** * Translates an index in this base to another base. For example, ZERO.translate(2, ONE) yields * 3 and ONE.translate(1, ZERO) yields 0. Note that supplying the same * index base as the target has no effect, so that if b is an index base constant, then * b.translate(n, b) returns n for every {@link Integer} n as long * as n is {@linkplain #isValidIndex(Integer) valid} (throwing an exception otherwise). * @param index The index to translate. * @param target The target index base to translate index into. * @return The value of index as it is represented in the index base target. * @throws IllegalArgumentException If index is invalid for this index base. * @see #isValidIndex(Integer) */ public Integer translate(Integer index, IndexBase target) { if(!isValidIndex(index)) { throw new IllegalArgumentException("invalid index for index base " + name() + ": " + index); } if(target == this) { return index; } return Integer.valueOf(index + (target.start - start)); } } ================================================ FILE: src/opennlp/ccg/alignment/Mapping.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.alignment; import static opennlp.ccg.alignment.PhrasePosition.*; /** * A mapping from an index in the {@linkplain PhrasePosition#A A} phrase position to an index in the * {@linkplain PhrasePosition#B B} phrase position. Mappings are interpreted as the individual pairs * that make up an {@link Alignment} from one {@link Phrase} to another. 
This class implements * {@link Comparable} so that mappings can be easily sorted (see the {@link #compareTo(Mapping)} method). *
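 * A minimal construction sketch (illustrative only; indices are in the default index base):
 * 
 * Mapping m = new Mapping(1, 2);      // word 1 in the A phrase aligned to word 2 in the B phrase
 * m.toString();                       // "1 &lt;-&gt; 2"
 * Mapping r = m.reverse();            // "2 &lt;-&gt; 1"
 * 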

* Although different * {@linkplain EncodingScheme encoding schemes} may use different {@linkplain IndexBase index bases}, all * mappings share a common one, namely {@link Alignments#DEFAULT_INDEX_BASE}. As such, no index can be * specified that is less than the {@linkplain IndexBase#nullValue null value} of that index base. Similarly, * the phrase number specified (if any) must be in the range of the * {@linkplain Alignments#DEFAULT_PHRASE_NUMBER_BASE default phrase number base}, * even though different encoding schemes may have different phrase number bases. *

* Since some {@linkplain EncodingScheme encoding schemes} do not require an * {@linkplain #getPhraseNumber() phrase number} * to be specified, the phrase number field may be null. However, none of the other fields may be * null. To specify that the mapping is to the special null word value, the * {@linkplain Alignments#DEFAULT_INDEX_BASE default index base}'s * {@linkplain IndexBase#nullValue null value} is used. * * @author Scott Martin * @see PhrasePosition * @see EncodingScheme * @see IndexBase * @see Alignments#DEFAULT_PHRASE_NUMBER_BASE * @see Alignments#DEFAULT_INDEX_BASE * @see Alignments#DEFAULT_STATUS * @see Alignments#DEFAULT_CONFIDENCE */ public class Mapping implements Comparable { final Integer phraseNumber, a, b; Status status; Double confidence; /** * Creates a mapping between the two specified indices with a null phrase number. * @see #Mapping(Integer, Integer, Integer) */ public Mapping(Integer a, Integer b) { this(null, a, b); } /** * Creates a mapping between the two specified indices with a null phrase number and the * {@linkplain Alignments#DEFAULT_STATUS default status}. * @see #Mapping(Integer, Integer, Integer, Status) */ public Mapping(Integer phraseNumber, Integer a, Integer b) { this(phraseNumber, a, b, Alignments.DEFAULT_STATUS); } /** * Creates a mapping between the two specified indices with the specified phrase number and status, with the * {@linkplain Alignments#DEFAULT_CONFIDENCE default confidence}. * @see #Mapping(Integer, Integer, Integer, Status, Double) */ public Mapping(Integer phraseNumber, Integer a, Integer b, Status status) { this(phraseNumber, a, b, status, Alignments.DEFAULT_CONFIDENCE); } /** * Creates a mapping between the two specified indices. * @param phraseNumber The phrase number of the corresponding mapping. * @param a The A index, corresponding to {@link PhrasePosition#A}. * @param b The B index, corresponding to {@link PhrasePosition#B}. * @param status The status of this mapping. * @param confidence This mapping's confidence value. * * @throws IndexOutOfBoundsException If any of phraseNumber, a, or * b is out of bounds according to the corresponding default. * @throws IllegalArgumentException If either index is null, or if status or * confidence is null. * * @see Alignments#DEFAULT_PHRASE_NUMBER_BASE * @see Alignments#DEFAULT_INDEX_BASE */ public Mapping(Integer phraseNumber, Integer a, Integer b, Status status, Double confidence) { checkPhraseNumber(phraseNumber); checkIndex(a); checkIndex(b); checkField(status, "status"); checkField(confidence, "confidence"); this.phraseNumber = phraseNumber; this.a = a; this.b = b; this.status = status; this.confidence = confidence; } /** * Gets a copy of this mapping with its {@linkplain #getPhraseNumber() phrase number} * set to the specified phrase number. This method is a convenience for the {@link MappingReader} class, * which, for certain encoding scheme like {@link MosesEncodingScheme}, may not be able to * parse the phrase number from the input string. * @param phraseNumber The phrase number the returned mapping should have. * @return This mapping if its {@linkplain #getPhraseNumber() phrase number} is null and the * specified phrase number is null, or if this mapping's phrase number is * {@linkplain Integer#equals(Object) equivalent to} the specified phrase number. Otherwise, a new * mapping is returned with all the same field values as this mapping, but with its phrase number set * to phraseNumber. 
* * @see #Mapping(Integer, Integer, Integer, Status, Double) */ public Mapping copyWithPhraseNumber(Integer phraseNumber) { if((this.phraseNumber == null && phraseNumber == null) || (this.phraseNumber != null && this.phraseNumber.equals(phraseNumber))) { return this; } return new Mapping(phraseNumber, a, b, status, confidence); } /** * Convenience method for creating mappings when the phrase position may possibly be * {@link PhrasePosition#B}. * @see #mappingByPosition(Integer, Integer, Integer, Status, Double, PhrasePosition) */ public static Mapping mappingByPosition(Integer phraseNumber, Integer a, Integer b, PhrasePosition firstPosition) { return mappingByPosition(phraseNumber, a, b, Alignments.DEFAULT_STATUS, Alignments.DEFAULT_CONFIDENCE, firstPosition); } /** * Convenience method for creating mappings in case which index should be {@linkplain #getA() A} and * which should be {@linkplain #getB() B} depends on the phrase position. * * @param phraseNumber The phrase number to use. * @param a The index to use either for the A (if the first position is * {@link PhrasePosition#A}) or B index (if the first position is {@link PhrasePosition#B}). * @param b The index to use either for the B (if the first position is * {@link PhrasePosition#A}) or A index (if the first position is {@link PhrasePosition#B}). * @param status The status to use. * @param confidence The confidence to use. * @param firstPosition Which phrase position the new mapping should reflect. If this argument is * {@link PhrasePosition#A}, the a argument will be the A index and the * b argument the B. If it is {@link PhrasePosition#B}, these are reversed. * @return A new mapping with its indices configured per the specified firstPosition. * @see Mapping#Mapping(Integer, Integer, Integer, Status, Double) */ public static Mapping mappingByPosition(Integer phraseNumber, Integer a, Integer b, Status status, Double confidence, PhrasePosition firstPosition) { return new Mapping(phraseNumber, (firstPosition == A) ? a : b, (firstPosition == B) ? a : b, status, confidence); } /** * Gets a new mapping just like this one except that the indices in the {@link PhrasePosition#A} * and {@link PhrasePosition#B} positions are swapped. The original status and confidence are * unchanged. * @return A mapping with indices reversed. * @see Mapping#mappingByPosition(Integer, Integer, Integer, Status, Double, PhrasePosition) */ public Mapping reverse() { return mappingByPosition(phraseNumber, a, b, status, confidence, B); } /** * Gets this mapping's phrase number. */ public Integer getPhraseNumber() { return phraseNumber; } /** * Gets this mapping's index in the {@linkplain PhrasePosition#A A-position}. * @return The value of {@link #get(PhrasePosition)} for {@link PhrasePosition#A}. */ public Integer getA() { return get(A); } /** * Gets this mapping's index in the {@linkplain PhrasePosition#B B-position}. * @return The value of {@link #get(PhrasePosition)} for {@link PhrasePosition#B}. */ public Integer getB() { return get(B); } /** * Gets this mapping's index at the specified phrase position. * @param pos The phrase position at which to return the corresponding index. * @return If pos is {@link PhrasePosition#A}, the A index; otherwise the B index. */ public Integer get(PhrasePosition pos) { return (pos == A) ? a : b; } /** * Gets this mapping's status. */ public Status getStatus() { return status; } /** * Sets this mapping's status to the specified value. 
*/ public void setStatus(Status status) { checkField(status, "status"); this.status = status; } /** * Gets this mapping's confidence. */ public Double getConfidence() { return confidence; } /** * Sets this mapping's confidence to the supplied value. * @param confidence May be null. No bounds checking is performed on this value even if it * is non-null. */ public void setConfidence(Double confidence) { checkField(confidence, "confidence"); this.confidence = confidence; } /** * Compares this mapping to another according to their natural ordering. The natural ordering of * mappings is that first their IDs are compared, then their A indices, then their B indices, * and finally their status and confidence value (in that order). *

* For the ID field, which may be null, the comparison is performed as follows. If both this mapping's * ID and the other's are null, they are considered equivalent. If this mapping's ID is non-null, it is * compared to the (possibly null) other mapping's ID via {@link Integer#compareTo(Integer)}. */ @Override public int compareTo(Mapping o) { int i = (phraseNumber == null && o.phraseNumber == null) ? 0 : phraseNumber.compareTo(o.phraseNumber); if(i == 0) { i = a.compareTo(o.a); } if(i == 0) { i = b.compareTo(o.b); } if(i == 0) { i = status.compareTo(o.status); } if(i == 0) { i = confidence.compareTo(o.confidence); } return i; } /** * Computes a hash code based on the ID, and A and B indices. The status and confidence fields are not * used for hash code computation because they are mutable. Because of this, two mappings may have * identical hash codes but not be equivalent according to {@link #equals(Object)}. */ @Override public int hashCode() { int h = 37 * 1 + a + b; return (phraseNumber == null) ? h : h + phraseNumber; } /** * Tests whether this mapping is equal to another. * @return true If this mapping's fields match the other according to the corresponding equals * methods. For the phrase number field, they are considered equal if both null * or if their corresponding equals method returns true, unequal otherwise. */ @Override public boolean equals(Object obj) { if(obj instanceof Mapping) { Mapping m = (Mapping)obj; return ((phraseNumber == null && m.phraseNumber == null) || phraseNumber.equals(m.phraseNumber)) && a.equals(m.a) && b.equals(m.b) && status.equals(m.status) && confidence.equals(m.confidence); } return false; } void checkPhraseNumber(Integer phraseNumber) throws IndexOutOfBoundsException { if(phraseNumber != null && !Alignments.DEFAULT_PHRASE_NUMBER_BASE.isValidIndex(phraseNumber)) { throw new IndexOutOfBoundsException("invalid phrase number: " + phraseNumber); } } void checkIndex(Integer index) throws IndexOutOfBoundsException { if(index == null) { throw new IllegalArgumentException("null index"); } if(!Alignments.DEFAULT_INDEX_BASE.isValidIndex(index)) { throw new IndexOutOfBoundsException("invalid index: " + index); } } void checkField(Object obj, String name) throws IllegalArgumentException { if(obj == null) { throw new IllegalArgumentException("null " + name); } } /** * A string representation of this mapping's indices. * @return For a mapping with a {@linkplain #getA() A} index of 3 and a * {@linkplain #getB() B} index of 6, this method gives the string * "3 <-> 6". */ @Override public String toString() { StringBuilder sb = new StringBuilder(a.toString()); sb.append(" <-> "); sb.append(b.toString()); return sb.toString(); } } ================================================ FILE: src/opennlp/ccg/alignment/MappingFormat.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. 
// // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.alignment; import static opennlp.ccg.alignment.Alignments.DEFAULT_CONFIDENCE; import static opennlp.ccg.alignment.Alignments.DEFAULT_INDEX_BASE; import static opennlp.ccg.alignment.Alignments.DEFAULT_PHRASE_NUMBER_BASE; import static opennlp.ccg.alignment.Alignments.DEFAULT_STATUS; import static opennlp.ccg.alignment.Alignments.DEFAULT_STRICTNESS; import static opennlp.ccg.alignment.MappingFormat.Field.A_INDEX_FIELD; import static opennlp.ccg.alignment.MappingFormat.Field.B_INDEX_FIELD; import static opennlp.ccg.alignment.MappingFormat.Field.CONFIDENCE_FIELD; import static opennlp.ccg.alignment.MappingFormat.Field.PHRASE_NUMBER_FIELD; import static opennlp.ccg.alignment.MappingFormat.Field.STATUS_FIELD; import java.text.FieldPosition; import java.text.Format; import java.text.ParseException; import java.text.ParsePosition; import java.util.HashMap; import java.util.HashSet; import java.util.Iterator; import java.util.List; import java.util.Map; import java.util.Set; import java.util.regex.Matcher; import java.util.regex.Pattern; /** * A class for formatting mappings according to an {@linkplain EncodingScheme encoding scheme} and a specified * set of {@linkplain Field formatting fields}. This class * extends {@link Format} so that it fits in with the Java text parsing API. *

* Care is always taken to translate a mapping's phrase number and indices to the target * encoding scheme's {@linkplain EncodingScheme#getIndexBase() index base}. * If a mapping format is not {@linkplain #isStrict() strict}, parsing is handled robustly in that it tolerates * fields that are optional and may not always be specified. On output, a non-strict mapping format will only * include fields that either (1) do not have a {@linkplain Field#hasDefaultValue() default value}, or (2) * have a value different from {@linkplain Field#getDefaultValue() the default}. Strict mapping * formats, on the other hand, always expect and generate all and only the {@linkplain #getFields() fields * specified}. *
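 * For illustration, a typical round trip might look like the following sketch (the scheme and the
 * input line are placeholders):
 * 
 * EncodingScheme scheme = ...;                         // e.g. a Moses-style scheme
 * MappingFormat format = MappingFormat.getInstance(scheme);
 * Mapping m = format.parseMapping(line);               // line encoded per the scheme
 * String s = format.formatMapping(m);                  // back to the scheme's encoding
 * 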

* Instances of mapping formats can be obtained by calling one of the * getInstance(...) methods. * * @see #getFields() * @see #isStrict() * @see EncodingScheme * @see IndexBase * @author Scott Martin */ public class MappingFormat extends Format { private static final long serialVersionUID = 1L; final EncodingScheme encodingScheme; final Set fields; final Pattern mappingPattern, fieldPattern; final boolean strict; private static Map> formatCache; /** * Marks mapping fields like ID, first index, second index, etc. Fields can have a * {@linkplain #getDefaultValue() default value}, which may be used depending on whether this format is * {@linkplain MappingFormat#isStrict() strict}. * @author Scott Martin */ public static class Field extends java.text.Format.Field { private static final long serialVersionUID = 1L; Object defaultValue = null; /** * Field representing a mapping's ID. */ public static final Field PHRASE_NUMBER_FIELD = new Field("PHRASE_NUMBER", null); /** * Field representing a mapping's A index. */ public static final Field A_INDEX_FIELD = new Field("A_INDEX", null); /** * Field representing a mapping's B index. */ public static final Field B_INDEX_FIELD = new Field("B_INDEX", null); /** * Field representing a mapping's status field. */ public static final Field STATUS_FIELD = new Field("STATUS", DEFAULT_STATUS); /** * Field representing a mapping's confidence field. */ public static final Field CONFIDENCE_FIELD = new Field("CONFIDENCE", DEFAULT_CONFIDENCE); /** * Creates a new mapping format field. * @param name The new field's name. * @param defaultValue The default value for this field. If this field does not have a default value, * null is specified. * @throws IllegalArgumentException if name is null. */ protected Field(String name, Object defaultValue) { super(name); if(name == null) { throw new IllegalArgumentException("name is null"); } this.defaultValue = defaultValue; } /** * Tests whether this field has a default value. * @return true If the {@linkplain #getDefaultValue() default value} is non-null. */ public boolean hasDefaultValue() { return defaultValue != null; } /** * Gets the default value for this field, if any. * @see #hasDefaultValue() */ public Object getDefaultValue() { return defaultValue; } /** * Overrides the superclass method to return the value of {@link java.text.Format.Field#getName()}. */ @Override public String toString() { return getName(); } } /** * Creates a mapping format based on the given encoding scheme and fields. The boolean flag tells instances * whether or not to output values when they are the default, or expect them during parsing. * * @param scheme The encoding scheme to create a formatter/parser for. * @param fields The fields to include. * @param strict Whether or not to use/expect default values in formatting and parsing. * @throws IllegalArgumentException If scheme or fields is null, * or if the specified set of fields does not contain all of the * {@linkplain EncodingScheme#getRequired() required fields} of the specified scheme. 
* @see Field#hasDefaultValue() */ protected MappingFormat(EncodingScheme scheme, Set fields, boolean strict) { if(scheme == null) { throw new IllegalArgumentException("encoding scheme is null"); } if(fields == null) { throw new IllegalArgumentException("fields is null"); } this.encodingScheme = scheme; this.fields = fields; this.strict = strict; if(!fields.containsAll(encodingScheme.getRequired())) { throw new IllegalArgumentException("specified fields does not contain all required fields"); } if(!encodingScheme.getOrder().containsAll(fields)) { throw new IllegalArgumentException("encoding scheme does not use all the specified fields"); } fieldPattern = Pattern.compile(scheme.getFieldDelimiter().toString()); mappingPattern = Pattern.compile("([\\w\\.]+" + scheme.getFieldDelimiter() + ")+[\\w\\.]+"); } /** * Gets an instance of a mapping formatter/parser for a given encoding scheme with the scheme's * {@linkplain EncodingScheme#getDefaults() default fields} as the specified fields. * @see #getInstance(EncodingScheme, Set) */ public static MappingFormat getInstance(EncodingScheme scheme) { return getInstance(scheme, scheme.getDefaults()); } /** * Gets an instance of a mapping formatter/parser for a given encoding scheme and field set. * @see #getInstance(EncodingScheme, Set, boolean) * @see Alignments#DEFAULT_STRICTNESS */ public static MappingFormat getInstance(EncodingScheme scheme, Set fields) { return getInstance(scheme, fields, DEFAULT_STRICTNESS); } /** * Gets an instance of a mapping formatter/parser for a given encoding scheme and field set. The * returned instances are cached to avoid creating multiple copies with the same scheme, fields, and * strictness flag. Cache access is synchronized to avoid threading issues. * * @param scheme The scheme to create a formatter/parser for. * @param fields The fields to include in the parser/formatter. * @param strict Whether the returned format should be {@linkplain #isStrict() strict}. * @return A new formatter/parser for mappings that will expect mappings encoded per the specified * scheme and will format mappings to strings of that encoding scheme. */ public static MappingFormat getInstance(EncodingScheme scheme, Set fields, boolean strict) { if(scheme == null) { // test for this here so null isn't added to cache as a key throw new IllegalArgumentException("encoding scheme is null"); } synchronized(MappingFormat.class) { MappingFormat mf = null; Set fs = null; if(formatCache == null) { formatCache = new HashMap>(); } else { fs = formatCache.get(scheme); } if(fs == null) { fs = new HashSet(); formatCache.put(scheme, fs); } for(MappingFormat f : fs) { if(f.strict == strict && f.fields.equals(fields)) { mf = f; break; } } if(mf == null) { mf = new MappingFormat(scheme, fields, strict); fs.add(mf); } return mf; } } /** * Gets the encoding scheme used by this mapping formatter/parser. * @return The encoding scheme used to create this instance. * @see #getInstance(EncodingScheme) */ public EncodingScheme getEncodingScheme() { return encodingScheme; } /** * Gets the field set used by this mapping formatter/parser. * @see #getInstance(EncodingScheme) */ public Set getFields() { return fields; } /** * Tests whether this mapping format will output default values, or expect them during parsing. If * true, this format will output and parse for every specified field. Otherwise, this format * will only write/expect fields that have a default value if their value differs from the default. 
* @see Field#hasDefaultValue() */ public boolean isStrict() { return strict; } /** * Formats a mapping according to the {@linkplain #getEncodingScheme() encoding scheme in effect}. * @param mapping The mapping to format. * @return A string in the format required by this formatter/parser's {@link #getEncodingScheme()}. * @see #format(Mapping, StringBuffer, FieldPosition) */ public String formatMapping(Mapping mapping) { List order = encodingScheme.getOrder(); Field field = null; int index = -1; for(int i = 0; i < order.size(); i++) { Field f = order.get(i); if(fields.contains(f)) { field = f; index = i; break; } } return format(mapping, new StringBuffer(), new FieldPosition(field, index)).toString(); } /** * Overrides the {@link Format#format(Object, StringBuffer, FieldPosition)} method to make sure the * specified Object obj is an instance of {@link Mapping}. * @see #format(Mapping, StringBuffer, FieldPosition) */ @Override public StringBuffer format(Object obj, StringBuffer toAppendTo, FieldPosition pos) { if(!(obj instanceof Mapping)) { throw new IllegalArgumentException("not a mapping: " + obj); } if(pos.getFieldAttribute() == null) { int i = pos.getField(); pos = new FieldPosition(fieldAtIndex(i), i); } return format((Mapping)obj, toAppendTo, pos); } /** * Formats a given {@link Mapping} based on the specified field position, appending the * output to the string buffer provided. * @param mapping The mapping to format. * @param toAppendTo The string buffer to append to. * @param pos The field position to use. * @return A string buffer with the information from mapping corresponding to the * field position pos appended to the one provided. * @throws IllegalArgumentException For the following reasons: *

    * <ul>
    * <li>An attempt is made to format a mapping with a {@link IndexBase#nullValue null index}.</li>
    * <li>The value of pos.getFieldAttribute() is not an instance of {@link MappingFormat.Field}.</li>
    * <li>The encoding scheme does not contain the field specified by pos.</li>
    * <li>The specified {@linkplain #getFields() list of fields} does not contain the field specified by pos.</li>
    * <li>Either a field required by the encoding scheme or the field specified by pos has a null value.</li>
    * </ul>
*/ public StringBuffer format(Mapping mapping, StringBuffer toAppendTo, FieldPosition pos) { if(mapping.a.equals(Alignments.DEFAULT_INDEX_BASE.nullValue) || mapping.b.equals(Alignments.DEFAULT_INDEX_BASE.nullValue)) { throw new IllegalArgumentException("cannot format null mapping: " + mapping); } java.text.Format.Field f = pos.getFieldAttribute(); if(!(f instanceof MappingFormat.Field)) { int i = pos.getField(); pos = new FieldPosition(fieldAtIndex(i), i); } Field field = (MappingFormat.Field)f; if(!encodingScheme.getOrder().contains(field)) { throw new IllegalArgumentException("no such field \'" + field + "\' in scheme " + encodingScheme); } if(!fields.contains(field)) { throw new IllegalArgumentException("field \'" + field + "\' not specified for this format"); } int start = toAppendTo.length(); for(Field af : encodingScheme.getOrder()) { if(!fields.contains(af)) { continue; } Object val = null; if(af.equals(PHRASE_NUMBER_FIELD)) { val = mapping.phraseNumber; } else if(af.equals(A_INDEX_FIELD)) { val = mapping.a; } else if(af.equals(B_INDEX_FIELD)) { val = mapping.b; } else if(af.equals(STATUS_FIELD)) { val = (strict || encodingScheme.getRequired().contains(STATUS_FIELD)) ? mapping.status : (mapping.status == DEFAULT_STATUS) ? null : mapping.status; } else if(af.equals(CONFIDENCE_FIELD)) { val = (strict || encodingScheme.getRequired().contains(CONFIDENCE_FIELD)) ? mapping.confidence : (mapping.confidence.equals(DEFAULT_CONFIDENCE)) ? null : mapping.confidence; } if(val == null) { // skip nulls, but check if(encodingScheme.getRequired().contains(af)) { throw new IllegalArgumentException("required field " + af + " contains null value"); } if(field.equals(af)) { throw new IllegalArgumentException("specified field " + field + " contains null value"); } } else { if(af.equals(PHRASE_NUMBER_FIELD) || af.equals(A_INDEX_FIELD) || af.equals(B_INDEX_FIELD)) { // translate indices? boolean pn = af.equals(PHRASE_NUMBER_FIELD); IndexBase mappingBase = pn ? encodingScheme.getPhraseNumberBase() : encodingScheme.getIndexBase(), defaultBase = pn ? DEFAULT_PHRASE_NUMBER_BASE : DEFAULT_INDEX_BASE; val = defaultBase.translate((Integer)val, mappingBase); } else if(af.equals(STATUS_FIELD)) { val = ((Status)val).abbreviation; } if(start < toAppendTo.length()) { toAppendTo.append(encodingScheme.getFieldDelimiter()); } if(field.equals(af)) { pos.setBeginIndex(toAppendTo.length()); } toAppendTo.append(val); if(field.equals(af)) { pos.setEndIndex(toAppendTo.length()); } } } return toAppendTo; } Field fieldAtIndex(int i) throws IndexOutOfBoundsException { Field f = encodingScheme.getOrder().get(i); if(f == null) { throw new IndexOutOfBoundsException("no field at position " + i); } return f; } /** * Parses a {@link Mapping} from a given string, based on the {@linkplain #getEncodingScheme() encoding * scheme} in effect. * @param source The string to parse. * @return A mapping object representing the specified string. * @throws ParseException If the string is ill-formed according to this formatter/parser's * {@link #getEncodingScheme() encoding scheme}. The exception thrown will contain an * {@linkplain ParseException#getErrorOffset() error offset} reflecting the position in the string where * the parse error occurred, if possible. 
*/ public Mapping parseMapping(String source) throws ParseException { ParsePosition pos = new ParsePosition(0); Mapping m = (Mapping)parseObject(source, pos); if(pos.getErrorIndex() != -1) { throw new ParseException("problem parsing input \"" + source + "\"", pos.getErrorIndex()); } return m; } /** * Overrides the {@link Format#parseObject(String, ParsePosition)} method to return a mapping, parsing * from the specified {@link ParsePosition}. * @see #parseMapping(String) */ @Override public Object parseObject(String source, ParsePosition pos) { if(pos == null) { throw new NullPointerException("parse position is null"); } int index = pos.getIndex(); Matcher matcher = mappingPattern.matcher(source); if(!matcher.matches()) { pos.setErrorIndex(index); return null; } if(matcher.start() != index) { pos.setErrorIndex(index); return null; } String[] chunks = fieldPattern.split(source); Iterator oi = encodingScheme.getOrder().iterator(); Map values = new HashMap(encodingScheme.getOrder().size()); for(int i = 0; i < chunks.length; i++) { String c = chunks[i]; if(c.length() == 0 || !oi.hasNext()) { pos.setErrorIndex(index); return null; } Object val; MappingFormat.Field af = null; while(oi.hasNext()) { af = oi.next(); try { if(af.equals(PHRASE_NUMBER_FIELD) || af.equals(A_INDEX_FIELD) || af.equals(B_INDEX_FIELD)) { boolean pn = af.equals(PHRASE_NUMBER_FIELD); IndexBase mappingBase = pn ? encodingScheme.getPhraseNumberBase() : encodingScheme.getIndexBase(), defaultBase = pn ? DEFAULT_PHRASE_NUMBER_BASE : DEFAULT_INDEX_BASE; try { val = mappingBase.translate(Integer.valueOf(c), defaultBase); } catch(IllegalArgumentException iie) { // thrown by IndexBase.translate() pos.setErrorIndex(index); return null; } // can't have null value if(((Integer)val).equals(defaultBase.nullValue)) { pos.setErrorIndex(index); return null; } } else if(af.equals(STATUS_FIELD)) { val = Status.forAbbreviation(c); } else if(af.equals(CONFIDENCE_FIELD)) { val = Double.valueOf(c); } else { val = null; } } catch(NumberFormatException e) { pos.setErrorIndex(index); return null; } if(val == null) { if(encodingScheme.getRequired().contains(af) || (strict && fields.contains(af))) { pos.setErrorIndex(index); return null; } continue; // keep going if not required } values.put(af, val); break; } // update parse index index += c.length(); if(i < chunks.length - 1) { index++; // add one for delimiter } } pos.setIndex(matcher.end()); Set keys = values.keySet(); if(!keys.containsAll(encodingScheme.getRequired()) || (strict && !keys.containsAll(fields))) { pos.setErrorIndex(index); return null; } Integer id = values.containsKey(PHRASE_NUMBER_FIELD) ? (Integer)values.get(PHRASE_NUMBER_FIELD) : null; Integer first = values.containsKey(A_INDEX_FIELD) ? (Integer)values.get(A_INDEX_FIELD) : null, second = values.containsKey(B_INDEX_FIELD) ? 
(Integer)values.get(B_INDEX_FIELD) : null; Status status = (Status)values.get(STATUS_FIELD); if(status == null && STATUS_FIELD.hasDefaultValue()) { status = (Status)STATUS_FIELD.defaultValue; } Double confidence = (Double)values.get(CONFIDENCE_FIELD); if(confidence == null && CONFIDENCE_FIELD.hasDefaultValue()) { confidence = (Double)CONFIDENCE_FIELD.defaultValue; } return new Mapping(id, first, second, status, confidence); } } ================================================ FILE: src/opennlp/ccg/alignment/MappingGroup.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.alignment; /** * Class for representing groups of mappings during reading or writing. * Mapping groups encapsulate a phrase number (usually associated with a * phrase's line number) and a number of mappings in the group (its * {@linkplain #getLength() length}). * * @author Scott Martin */ public class MappingGroup implements Comparable { Integer phraseNumber; int length; /** * Creates a new mapping group with the given phrase number and length. * @throws IllegalArgumentException if phraseNumber is null, or if * length < 0. */ public MappingGroup(Integer phraseNumber, int length) { if(phraseNumber == null) { throw new IllegalArgumentException("phraseNumber is null"); } if(length < 0) { throw new IllegalArgumentException("length < 0: " + length); } this.phraseNumber = phraseNumber; this.length = length; } /** * Gets this group's phrase number. */ public Integer getPhraseNumber() { return phraseNumber; } /** * Gets the length of this mapping group. */ public int getLength() { return length; } /** * Tests whether this group is equal to another by comparing the two groups' * phrase numbers and lengths. */ @Override public boolean equals(Object obj) { if(obj instanceof MappingGroup) { MappingGroup ag = (MappingGroup)obj; return phraseNumber.equals(ag.phraseNumber) && length == ag.length; } return false; } /** * Compares this mapping group to another by comparing their IDs and lengths. */ public int compareTo(MappingGroup ag) { int i = phraseNumber.compareTo(ag.phraseNumber); if(i == 0) { i = (length == ag.length) ? 0 : length < ag.length ? -1 : 1; } return i; } /** * Computes a hash code for this mapping group based on its ID and length. */ @Override public int hashCode() { // brackets are to guard against 0 return 37 * (1 + phraseNumber.intValue() + length); } /** * Gets a string representation of this group. * @return For a group with phrase number 37 and length * 12, the string "Group 37 (12 mappings)". 
*/ @Override public String toString() { StringBuilder sb = new StringBuilder("Group "); sb.append(phraseNumber); sb.append(" ("); sb.append(length); sb.append(" mappings)"); return sb.toString(); } } ================================================ FILE: src/opennlp/ccg/alignment/MappingReader.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.alignment; import java.io.FilterReader; import java.io.IOException; import java.io.Reader; import java.text.ParseException; import java.util.LinkedList; import java.util.Queue; /** * Class for reading {@link Mapping}s from an underlying reader based on a specified {@link MappingFormat}. *

* Instances of this class read mappings group by group, with {@link #nextGroup()} called after reading the * correct number of mappings for the current group, as signaled by the {@link #canRead()} method. *

* The following code fragment illustrates the usage of this class: *

 * MappingReader reader = ...;
 * 
 * MappingGroup g;
 * while((g = reader.nextGroup()) != null) {
 * 	while(reader.canRead()) {
 * 		Mapping m = reader.readMapping();
 * 		...
 * 	}
 * }
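 * 
 * Here, the reader might be created as in the following sketch (the encoding scheme and file name
 * are placeholders), after which the loop above applies unchanged:
 * 
 * EncodingScheme scheme = ...;
 * MappingFormat format = MappingFormat.getInstance(scheme);
 * MappingReader reader = new MappingReader(new FileReader("alignments.txt"), format);
 * 
 * Closing the reader with {@link #close()} checks that the last group was read completely.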
* @author Scott Martin * @see MappingFormat */ public class MappingReader extends FilterReader { final MappingFormat format; private MappingGroup currentGroup; private Queue mappingQueue; private int mappingCount = 0; private boolean skipLF = false; /** * Creates a mapping reader. * @param r The underlying reader. * @param format The mapping format to use for reading {@link Mapping}s. * @throws IllegalArgumentException if format is null. */ public MappingReader(Reader r, MappingFormat format) { super(r); if(format == null) { throw new IllegalArgumentException("format is null"); } this.format = format; mappingQueue = new LinkedList(); } /** * @return The format used to read mappings. */ public MappingFormat getFormat() { return format; } /** * Starts reading from the next mapping group. * @return The next {@link MappingGroup} found by reading from the underlying reader. * @throws IOException If a {@link ParseException} is encountered when calling * {@link MappingFormat#parseMapping(String)} based on the underlying input, or if one is thrown by the * underlying reader. An IOException is also thrown if the number of mappings in the * {@linkplain MappingGroup#getLength() current group} could not be read. */ public MappingGroup nextGroup() throws IOException { checkMappingCount(); mappingCount = 0; MappingGroup previous = (currentGroup == null) ? null : currentGroup; int newCount = mappingQueue.size(); currentGroup = (newCount == 0) ? null : new MappingGroup(mappingQueue.peek().phraseNumber, newCount); boolean eog = false; while(!eog) { StringBuilder sb = new StringBuilder(); int i; while((i = in.read()) != -1) { char c = (char)i; if(skipLF) { skipLF = false; if(c == '\n') { continue; } } if(c == '\r') { skipLF = true; } if(format.encodingScheme.isMappingDelimiter(c)) { break; } else if(format.encodingScheme.isGroupDelimiter(c)) { eog = true; break; } else { sb.append(c); } } if(sb.length() == 0) { break; // for EOF and end of group } Mapping a = null; try { a = format.parseMapping(sb.toString()); } catch(ParseException pe) { throw new IOException(((currentGroup == null) ? "" : "group " + currentGroup.phraseNumber + ": ") + "problem formatting mapping " + sb.toString() + " at offset " + pe.getErrorOffset() + ": " + pe.getMessage(), pe); } // if the format allows null IDs, use previous's running counter if(currentGroup == null) { Integer I = (a.phraseNumber == null) ? (previous == null) ? format.encodingScheme.getPhraseNumberBase().start : previous.phraseNumber + 1 : a.phraseNumber; currentGroup = new MappingGroup(I, 0); } if(a.phraseNumber == null) { // have to copy because phraseNumber is immutable (and final) a = a.copyWithPhraseNumber(currentGroup.phraseNumber); } if(!currentGroup.phraseNumber.equals(a.phraseNumber)) { eog = true; } else { newCount++; // only increment if should be read } if(!mappingQueue.offer(a)) { // save for next read throw new IOException("unable to read mapping"); } } if(currentGroup != null) { currentGroup.length = newCount; } return (currentGroup == null || currentGroup.length == 0) ? null : currentGroup; } /** * Tests whether mappings can be read from this reader without throwing an {@link IOException}. * @return true If there is a current mapping group and mappings remain to be read from it. * @see #nextGroup() * @see #readMapping() */ public boolean canRead() { return currentGroup != null && mappingCount < currentGroup.length; } /** * Overrides the superclass method to check first if any mappings are available. * @throws IOException If no mappings are available. 
* @see #canRead() */ @Override public int read() throws IOException { checkRead(); int c = super.read(); if(skipLF) { skipLF = false; if(c == '\n') { c = super.read(); } } return c; } /** * Overrides the superclass method to check first if any mappings are available. * @throws IOException If no mappings are available. * @see #canRead() */ @Override public int read(char[] cbuf, int off, int len) throws IOException { checkRead(); if(len < 1) { return 0; } if(skipLF) { int c = read(); skipLF = false; if(c == -1) { return c; } else if(c != '\n') { cbuf[off++] = (char)c; len--; } } return super.read(cbuf, off, len); } /** * Tests whether mappings can be read without blocking. * @return true If it is guaranteed that a call to {@link #readMapping()} will not block for input. */ @Override public boolean ready() throws IOException { return canRead(); } /** * Reads a mapping from the underlying reader, if one is {@linkplain #canRead() available}. * @return A mapping formatted by the {@linkplain #getFormat() format in effect}. * @throws IOException If no mappings are available in the current group. * @see #canRead() */ public Mapping readMapping() throws IOException { checkRead(); Mapping a = mappingQueue.poll(); if(a != null) { mappingCount++; } return a; } /** * Closes this reader, checking first if the correct number of mappings were read. * @throws IOException If mappings remain to be read from the current group. */ @Override public void close() throws IOException { try { checkMappingCount(); } finally { super.close(); } } void checkRead() throws IOException { if(!canRead()) { throw new IOException("no mappings available"); } } void checkMappingCount() throws IOException { if((currentGroup == null && mappingCount > 0) || (currentGroup != null && mappingCount != currentGroup.length)) { throw new IOException( currentGroup == null ? "" : "group " + currentGroup.phraseNumber + ": " + "mapping count does not match: expected " + ((currentGroup == null) ? 0 : currentGroup.length) + ", but was " + mappingCount); } } } ================================================ FILE: src/opennlp/ccg/alignment/MappingWriter.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.alignment; import java.io.FilterWriter; import java.io.IOException; import java.io.Writer; /** * A writer for outputting {@link Mapping}s to a specified underlying {@link Writer}. *

* Mapping writers write mappings by group, so that before any mappings are written, * {@link #startGroup(MappingGroup)} must always be called * to signal to the writer that a new group is starting (and what its length is). The outgoing mappings are * formatted according to a {@link MappingFormat} specified at creation. *

* After a new group is started, exactly the {@linkplain MappingGroup#getLength() number of mappings} in that * group must be written. Otherwise, an {@link IOException} is thrown. An {@link IOException} is also thrown * if an attempt is made to write a mapping whose {@linkplain Mapping#getPhraseNumber() id} is different from the * current group's {@linkplain MappingGroup#getPhraseNumber() id}, or if {@link #writeMapping(Mapping)} is called without * first calling {@link #startGroup(MappingGroup)}. *

* Example usage: *

 * MappingWriter mw = ...;
 * 
 * // while there are more groups
 * mw.startGroup(new MappingGroup(...));
 * while(mw.canWrite()) {
 * 	mw.writeMapping(...);
 * }
 * 
 * mw.close();
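 * 
 * Concretely (an illustrative sketch; the encoding scheme, file name, and index values are placeholders):
 * 
 * EncodingScheme scheme = ...;
 * MappingWriter mw = new MappingWriter(new FileWriter("alignments.out"), MappingFormat.getInstance(scheme));
 * mw.startGroup(new MappingGroup(1, 2));   // phrase 1, two mappings to follow
 * mw.writeMapping(new Mapping(1, 1, 2));
 * mw.writeMapping(new Mapping(1, 2, 3));
 * mw.endGroup();
 * mw.close();
 * 
 * Note that {@link #startGroup(MappingGroup)} calls {@link #endGroup()} automatically if the previous
 * group was not ended explicitly.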
* @author Scott Martin */ public class MappingWriter extends FilterWriter { final MappingFormat format; private MappingGroup currentGroup; private int mappingCount = 0; private String mappingDelimiter, groupDelimiter; /** * Creates a new mapping writer. * @param out The underlying writer. * @param format The mapping format to use. * @throws IllegalArgumentException if format is null. */ public MappingWriter(Writer out, MappingFormat format) { super(out); if(format == null) { throw new IllegalArgumentException("format is null"); } this.format = format; } /** * Gets the mapping format used by this writer. */ public MappingFormat getFormat() { return format; } /** * Gets the current mapping group being written. */ public MappingGroup getCurrentGroup() { return currentGroup; } void checkWrite() throws IOException { if(!canWrite()) { throw new IOException("unable to write"); } } void checkMappingCount() throws IOException { if(currentGroup != null && mappingCount != currentGroup.length) { throw new IOException("incorrect mapping count for group " + + currentGroup.phraseNumber + "; expected " + currentGroup.length + ", but was " + mappingCount); } } /** * Starts a new mapping group for writing mappings. If {@link #endGroup()} was not called explicitly, * it is first called to end the current group. * @param mappingGroup The group to start. * @throws IOException If the number of mappings written since the last call to * {@link #startGroup(MappingGroup)}does not exactly equal the length of the * {@linkplain #getCurrentGroup() current group}. * @see #writeMapping(Mapping) * @see #endGroup() */ public void startGroup(MappingGroup mappingGroup) throws IOException { if(currentGroup != null) { endGroup(); } currentGroup = mappingGroup; } /** * Ends the current group, writing the {@linkplain EncodingScheme#getGroupDelimiter() proper group * delimiter} for the {@linkplain #getFormat() mapping format in effect}. * @throws IOException If {@link #startGroup(MappingGroup)} was not first called, or if the correct number * of mappings for the current group was not written. * @see #startGroup(MappingGroup) */ public void endGroup() throws IOException { if(currentGroup == null) { throw new IOException("no current group"); } checkMappingCount(); if(currentGroup.length > 0) { if(groupDelimiter == null) { Character gd = format.encodingScheme.getGroupDelimiter(); groupDelimiter = AbstractEncodingScheme.isLineSeparator(gd) ? System.getProperty("line.separator") : String.valueOf(gd); } out.write(groupDelimiter); // no empty lines } currentGroup = null; mappingCount = 0; } /** * Writes to the underlying writer, first checking if mappings can be written. * @see #canWrite() */ @Override public void write(char[] cbuf, int off, int len) throws IOException { checkWrite(); super.write(cbuf, off, len); } /** * Writes to the underlying writer, first checking if mappings can be written. * @see #canWrite() */ @Override public void write(int c) throws IOException { checkWrite(); super.write(c); } /** * Writes to the underlying writer, first checking if mappings can be written. * @see #canWrite() */ @Override public void write(String str, int off, int len) throws IOException { checkWrite(); super.write(str, off, len); } /** * Writes to the underlying writer, first checking if mappings can be written. * @see #canWrite() */ @Override public void write(char[] cbuf) throws IOException { checkWrite(); super.write(cbuf); } /** * Writes to the underlying writer, first checking if mappings can be written. 
* @see #canWrite() */ @Override public void write(String str) throws IOException { checkWrite(); super.write(str); } /** * Tests whether the mapping writer is currently in a state in which mappings can be written without * throwing an {@link IOException}. Mappings * can only be written when a current group has been {@linkplain #startGroup(MappingGroup) started} and * the number of mappings written since the last group started is less than the total * {@linkplain MappingGroup#getLength() length} of the current group. * @return true If the {@linkplain #getCurrentGroup() current group} is non-null and the number of mappings * written to the current group is less than its length. */ public boolean canWrite() { return currentGroup != null && mappingCount < currentGroup.length; } /** * Writes a mapping to the underlying writer, formatted by {@linkplain #getFormat() the mapping format}. If * other mappings have been written since the last call to {@link #startGroup(MappingGroup)}, the * {@linkplain EncodingScheme#getMappingDelimiter() mapping delimiter} used by the current format is first * written. * @param mapping The mapping to write. * @throws IOException If {@link #canWrite()} returns false, if * {@link #startGroup(MappingGroup)} was not first called, or if an attempt is made * to write a mapping with an {@linkplain Mapping#getPhraseNumber() id} that does not equal the current group's * {@linkplain MappingGroup#getPhraseNumber() id}. */ public void writeMapping(Mapping mapping) throws IOException { checkWrite(); if(mapping == null) { throw new NullPointerException("null mapping"); } if(mapping.phraseNumber != null && !mapping.phraseNumber.equals(currentGroup.phraseNumber)) { throw new IOException("mapping from group " + mapping.phraseNumber + ", but current group is " + currentGroup.phraseNumber); } if(mappingCount > 0) { if(mappingDelimiter == null) { Character md = format.encodingScheme.getMappingDelimiter(); mappingDelimiter = AbstractEncodingScheme.isLineSeparator(md) ? System.getProperty("line.separator") : String.valueOf(md); } out.write(mappingDelimiter); } out.write(format.formatMapping(mapping)); mappingCount++; } /** * Overrides the superclass method to first check that the correct number of mappings were written. * @throws IOException If a number of mappings have been written that does not exactly equal the length * of the {@linkplain #getCurrentGroup() current group}. */ @Override public void close() throws IOException { try { checkMappingCount(); } finally { super.close(); } } } ================================================ FILE: src/opennlp/ccg/alignment/MosesEncodingScheme.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.alignment; import static opennlp.ccg.alignment.MappingFormat.Field.A_INDEX_FIELD; import static opennlp.ccg.alignment.MappingFormat.Field.B_INDEX_FIELD; import static opennlp.ccg.alignment.MappingFormat.Field.STATUS_FIELD; import java.util.Arrays; import java.util.HashSet; /** * Represents the Moses encoding. * * * * * * * *
 * Field separator:    -
 * Mapping separator:  (space)
 * Group separator:    (newline)
 * ID base:            {@link IndexBase#ZERO}
 * Index base:         {@link IndexBase#ZERO}
 * Example group:      0-1 2-3 2-4-P 3-0
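 * <p>
 * A minimal usage sketch (illustrative only; the example group above is repeated in the comments,
 * and only the public constructor shown below is assumed):
 * <pre>
 * // "0-1 2-3 2-4-P 3-0" encodes four mappings with zero-based word indices;
 * // "2-4-P" carries an explicit POSSIBLE status abbreviation in its third field.
 * EncodingScheme moses = new MosesEncodingScheme();
 * </pre>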
* @see Moses Word Alignment Tutorial * * @author Scott Martin */ public class MosesEncodingScheme extends AbstractEncodingScheme { /** * Creates a new instance of the Moses encoding scheme. * @see Alignments#MOSES_ENCODING_SCHEME */ public MosesEncodingScheme() { super('-', ' ', '\n', Alignments.DEFAULT_INDEX_BASE, IndexBase.ZERO, new HashSet(Arrays.asList(A_INDEX_FIELD, B_INDEX_FIELD, STATUS_FIELD)), new HashSet(Arrays.asList(A_INDEX_FIELD, B_INDEX_FIELD)), A_INDEX_FIELD, B_INDEX_FIELD, STATUS_FIELD); } } ================================================ FILE: src/opennlp/ccg/alignment/NAACLEncodingScheme.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.alignment; import static opennlp.ccg.alignment.MappingFormat.Field.*; import java.util.Arrays; import java.util.HashSet; /** * Represents the NAACL shared task encoding. * * * * * * * *
 * Field separator:    (space)
 * Mapping separator:  (newline)
 * Group separator:    (newline)
 * ID base:            {@link IndexBase#ZERO}
 * Index base:         {@link IndexBase#ONE}
 * Example group:
 * 37 1 2 S
 * 37 3 4 S
 * 37 3 5 P
 * 37 4 1 S
 * 
*
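 * <p>
 * A minimal usage sketch (illustrative only), reading the example group above: word indices are
 * one-based while phrase IDs are zero-based, so "37 1 2 S" surely aligns the first word of
 * phrase 37's "A" side with the second word of its "B" side.
 * <pre>
 * EncodingScheme naacl = new NAACLEncodingScheme();
 * </pre>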
* @see NAACL shared task word alignment guidelines * @author Scott Martin */ public class NAACLEncodingScheme extends AbstractEncodingScheme { /** * Creates a new instance of the NAACL encoding scheme. * @see Alignments#NAACL_ENCODING_SCHEME */ public NAACLEncodingScheme() { super(' ', '\n', '\n', IndexBase.ZERO, IndexBase.ONE, Alignments.NAACL_DEFAULT_FIELDS, new HashSet(Arrays.asList(PHRASE_NUMBER_FIELD, A_INDEX_FIELD, B_INDEX_FIELD)), PHRASE_NUMBER_FIELD, A_INDEX_FIELD, B_INDEX_FIELD, STATUS_FIELD, CONFIDENCE_FIELD); } } ================================================ FILE: src/opennlp/ccg/alignment/Phrase.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.alignment; import java.util.AbstractList; import java.util.List; /** * A phrase, i.e., a sequence of words with an associated {@linkplain #getNumber() phrase number}. * Phrases may additionally have a {@linkplain #getId() string ID}. * To save access time and space, this class is backed by an array of * {@link String}s, but extends {@link AbstractList} so that phrases can be iterated over and have * all of the usual convenience methods. *

* Phrases are immutable once created, so calling any of the {@link List#add(Object)}, * {@link List#remove(int)}, or {@link List#set(int, Object)} * methods will throw an {@link UnsupportedOperationException}. Similarly, the * {@linkplain #iterator() iterator's} remove() method also throws an * {@link UnsupportedOperationException}. *

* For convenience, this class implements the {@link Comparable} interface, comparing * phrases by their {@linkplain #getNumber() numbers}. * * @author Scott Martin */ public class Phrase extends AbstractList implements Comparable { final Integer number; final String id; final String[] words; /** * Creates a new phrase with the given number and list of words. * @see Phrase#Phrase(String, Integer, String...) */ public Phrase(Integer number, List words) { this(number, words.toArray(new String[words.size()])); } /** * Creates a new phrase with the specified number, made up of the given words. * @see Phrase#Phrase(String, Integer, String...) */ public Phrase(Integer number, String... words) { this(null, number, words); } /** * Creates a new phrase with the given number, ID, and list of words. * @see Phrase#Phrase(String, Integer, String...) */ public Phrase(String id, Integer number, List words) { this(id, number, words.toArray(new String[words.size()])); } /** * Creates a new phrase with the specified number and id, made up of the given words. * The ID may be null, but the cannot be null. The list of words cannot be * null or contain null members, although it can be empty. * @throws IllegalArgumentException If number, words is null, * or one of the strings in words is null. */ public Phrase(String id, Integer number, String... words) { checkObject(number, "number"); checkObject(words, "words"); for(int i = 0; i < words.length; i++) { checkObject(words[i], "word " + i); } this.number = number; this.id = id; this.words = words; } void checkObject(Object obj, String name) { if(obj == null) { throw new IllegalArgumentException(name + " is null"); } } /** * Gets this phrase's ID, if any was specified. * @return The ID of this phrase, possibly null. */ public String getId() { return id; } /** * @return This phrase's number. */ public Integer getNumber() { return number; } /** * Returns the word in this phrase at the supplied index. */ @Override public String get(int index) { return words[index]; } /** * @return The number of words in this phrase. */ @Override public int size() { return words.length; } /** * Compares this phrase to another by comparing their {@linkplain #getNumber() numbers}. * @return The value of getNumber().compareTo(o.getNumber()). * @param o The phrase to compare to. * @see Integer#compareTo(Integer) */ @Override public int compareTo(Phrase o) { return getNumber().compareTo(o.getNumber()); } /** * Tests whether this phrase is equal to another by first calling the superclass method * {@link AbstractList#equals(Object)}, then comparing this phrase's number and id to the other. */ @Override public boolean equals(Object o) { if(o instanceof Phrase && super.equals(o)) { Phrase p = (Phrase)o; return number.equals(p.number) && ((id == null && p.id == null) || id.equals(p.id)); } return false; } /** * Generates a hash code for this phrase based on the superclass hash code, its number, and its ID * (if any). */ @Override public int hashCode() { int h = 31 * super.hashCode() + number.hashCode(); return (id == null) ? h : h + id.hashCode(); } /** * Gets a string representation of this phrase. 
* @return For a phrase with number 37, ID phrase 3, and words * "Test phrase", prepends 37 (phrase 3): to the result of calling the * superclass method {@link AbstractList#toString()}; */ @Override public String toString() { StringBuilder sb = new StringBuilder(number.toString()); if(id != null) { sb.append(" ("); sb.append(id); sb.append(')'); } sb.append(": "); sb.append(super.toString()); return sb.toString(); } } ================================================ FILE: src/opennlp/ccg/alignment/PhrasePosition.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.alignment; /** * In an alignment, a phrase position indicates which of the two aligned phrases * is first (the "A" phrase) and which is second (the "B" phrase) * in terms of the alignment indices. * * @author Scott Martin */ public enum PhrasePosition { /** * The "A" position. */ A, /** * The "B" position. */ B; /** * Gives the opposite of this phrase position. * @return {@link #B} if this position is {@link #A}, otherwise * {@link #A}. */ public PhrasePosition opposite() { return (this == A) ? B : A; } } ================================================ FILE: src/opennlp/ccg/alignment/PhraseReader.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.alignment; import java.io.IOException; import java.io.LineNumberReader; import java.io.Reader; /** * A phrase reader just reads line numbers, but does not search for phrase IDs. The line number of each phrase * read is {@linkplain IndexBase#translate(Integer, IndexBase) translated} into the {@link IndexBase} provided * at creation. 
* @author Scott Martin */ public class PhraseReader extends LineNumberReader { final IndexBase numberBase; /** * The index base that starts numbering lines at 1. * @see IndexBase#ONE */ public static final IndexBase LINE_NUMBER_BASE = IndexBase.ONE; /** * Creates a phrase reader from the specified underlying reader and word index base for phrase numbers. * @see #PhraseReader(Reader, IndexBase) * @see Alignments#DEFAULT_PHRASE_NUMBER_BASE */ public PhraseReader(Reader in) { this(in, Alignments.DEFAULT_PHRASE_NUMBER_BASE); } /** * Creates a phrase reader. * @param numberBase The target phrase numbering base. Phrases read from the underlying reader will have * their numbers translated from {@link #LINE_NUMBER_BASE the default} to numberBase. * @throws IllegalArgumentException if numberBase is null. * @see IndexBase#translate(Integer, IndexBase) * @see #readPhrase() */ public PhraseReader(Reader in, IndexBase numberBase) { super(in); if(numberBase == null) { throw new IllegalArgumentException("numberBase is null"); } this.numberBase = numberBase; } /** * The target number base that new phrase IDs will have their line numbers translated into. * @see #readPhrase() */ public IndexBase getNumberBase() { return numberBase; } /** * Gets the number last assigned to a phrase, translated into the specified * {@linkplain #getNumberBase() number base}. Note that this method may return a different result than * {@link #getLineNumber()} due to the base translation. * @see IndexBase#translate(Integer, IndexBase) */ public Integer getPhraseNumber() { return LINE_NUMBER_BASE.translate(getLineNumber(), numberBase); } /** * Reads the next phrase from the underlying reader. The number is determined by translating the line number * of the phrase into the {@linkplain #getNumberBase() target number base}. The words in the phrase are * tokenized by the {@link Alignments#tokenize(String)} method. * @return null if no phrases can be read from the underlying reader. */ public Phrase readPhrase() throws IOException { String ln = readLine(); return (ln == null) ? null : new Phrase(getPhraseNumber(), Alignments.tokenize(ln)); } } ================================================ FILE: src/opennlp/ccg/alignment/PhraseWriter.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.alignment; import java.io.FilterWriter; import java.io.IOException; import java.io.PrintWriter; import java.io.Writer; /** * A writer for phrases. This writer writes {@linkplain Phrase phrase} instances to the underlying writer with * the specified string as a word separator. 
No markup is placed around phrases that are written; only a line * separator is written after the phrase. * * @author Scott Martin * @see Alignments#untokenize(String[], String) */ public class PhraseWriter extends FilterWriter { final String wordSeparator; protected PrintWriter printWriter; /** * Creates a new phrase writer with the default word separator. * @see #PhraseWriter(Writer, String) * @see Alignments#DEFAULT_WORD_SEPARATOR */ public PhraseWriter(Writer out) { this(out, Alignments.DEFAULT_WORD_SEPARATOR); } /** * Creates a new phrase writer for the underlying input stream that will use * the specified word separator when untokenizing phrases. * * @param wordSeparator The word separator to use when translating phrases into strings. * @throws IllegalArgumentException if wordSeparator is null. * @see Alignments#untokenize(String[], String) */ public PhraseWriter(Writer out, String wordSeparator) { super(new PrintWriter(out)); if(wordSeparator == null) { throw new IllegalArgumentException("wordSeparator is null"); } this.wordSeparator = wordSeparator; printWriter = (PrintWriter)this.out; } /** * Gets the word separator that this phrase writer uses when writing phrases. */ public String getWordSeparator() { return wordSeparator; } /** * Writes a phrase by {@linkplain Alignments#untokenize(List, String) untokenizing} its words * according to the {@linkplain #getWordSeparator() word separator being used}. Before writing the * untokenized phrase, {@link #preWritePhrase(Phrase)} is called exactly once. After writing the phrase, * {@link #postWritePhrase(Phrase)} is called exactly once. * * @param phrase The phrase to write. * @throws IOException If the underlying writer throws an {@link IOException}, or if one is thrown by * either {@link #preWritePhrase(Phrase)} or {@link #postWritePhrase(Phrase)}. */ public void writePhrase(Phrase phrase) throws IOException { preWritePhrase(phrase); printWriter.print(Alignments.untokenize(phrase, wordSeparator)); postWritePhrase(phrase); } /** * Called before {@link #writePhrase(Phrase)} (to be overridden by implementing classes). * @param phrase The phrase about to be written. */ protected void preWritePhrase(Phrase phrase) throws IOException { // default is to do nothing } /** * Called after {@link #writePhrase(Phrase)} (to be overridden by implementing classes). This implementation * just writes a line separator. * @param phrase The phrase that was just written. */ protected void postWritePhrase(Phrase phrase) throws IOException { printWriter.println(); } } ================================================ FILE: src/opennlp/ccg/alignment/Status.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.alignment; /** * A set of {@link Enum} constants for describing the status of a {@linkplain Mapping mapping}, either as * {@link #POSSIBLE} or {@link #SURE}. *

* Statuses have a corresponding {@linkplain #getAbbreviation() abbreviated form} for use when mappings are * formatted and parsed as strings. The enum constants are arranged in order of strength of surety, so that * {@link Enum#ordinal()} returns numbers in order of increasing surety. * * @author Scott Martin * @see MappingFormat */ public enum Status { /** * The status of a mapping that is only possible, not sure. */ POSSIBLE, /** * The status of a sure mapping (not just possible). */ SURE; /** * An abbreviated form for this status, for use in parsing and formatting. * @see MappingFormat */ final String abbreviation; private Status() { this.abbreviation = name().substring(0, 1); } /** * Gets the abbreviated form of this status, "S" for {@link #SURE} * and "P" for {@link #POSSIBLE}. */ public String getAbbreviation() { return abbreviation; } /** * Gives the status constant corresponding to the given abbreviation. * @param abbreviation The abbreviated form to find a status constant for. * @return A status constant if one is found whose {@link #getAbbreviation()} is equal to the specified * abbreviation, otherwise null. */ public static Status forAbbreviation(String abbreviation) { for(Status s : values()) { if(s.abbreviation.equals(abbreviation)) { return s; } } return null; } } ================================================ FILE: src/opennlp/ccg/alignment/package.html ================================================

This package provides classes for modeling alignments between two phrases.

The {@link opennlp.ccg.alignment.Phrase} class models a phrase as simply a list of words. A single alignment between an index in one phrase and an index in another is captured by the {@link opennlp.ccg.alignment.Mapping} class. The {@link opennlp.ccg.alignment.Alignment} class is built on top of Phrase and Mapping, encapsulating an "A" phrase and a "B" phrase along with a set of mappings between them (see {@link opennlp.ccg.alignment.PhrasePosition}).

Since there are multiple different encoding schemes for representing alignments, a goal of this package is to make the conceptual representation of aligned phrases as independent of encoding as possible. The interface {@link opennlp.ccg.alignment.EncodingScheme} gives a way to represent encoding schemes, and two popular encoding schemes (Moses and NAACL) are provided by this package. Different encoding schemes use different numbering bases: some start numbering indices at 0 and some at 1. To reconcile this difference, the class {@link opennlp.ccg.alignment.IndexBase} provides a way to translate different numbering bases into a common index base. The {@link opennlp.ccg.alignment.MappingFormat} class extends {@link java.text.Format} to give encoding-independent formatting and parsing for mappings.

The classes {@link opennlp.ccg.alignment.PhraseReader} and {@link opennlp.ccg.alignment.PhraseWriter} (and their descendants), {@link opennlp.ccg.alignment.MappingReader} and {@link opennlp.ccg.alignment.MappingWriter} provide convenient ways to read and write phrases and mappings. Lastly, the non-instantiable class {@link opennlp.ccg.alignment.Alignments} provides some convenience methods for reading phrases, mappings and alignments.

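A minimal usage sketch (the file name is hypothetical and exception handling is omitted; only constructors and methods documented in this package are used), reading whitespace-tokenized phrases one per line:

<pre>
// hedged sketch: each line read becomes a Phrase whose number is its translated line number
java.io.Reader in = new java.io.FileReader("phrases.txt"); // hypothetical input file
PhraseReader reader = new PhraseReader(in);                // default phrase number base
Phrase phrase;
while ((phrase = reader.readPhrase()) != null) {
    System.out.println(phrase.getNumber() + ": " + phrase.size() + " words");
}
reader.close();
</pre>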
================================================ FILE: src/opennlp/ccg/disjunctivizer/AlignedEdgeFilter.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.disjunctivizer; import static opennlp.ccg.disjunctivizer.MatchType.SOURCE_ALIGNED; import static opennlp.ccg.disjunctivizer.MatchType.SOURCE_UNALIGNED; import static opennlp.ccg.disjunctivizer.MatchType.TARGET_ALIGNED; import static opennlp.ccg.disjunctivizer.MatchType.TARGET_UNALIGNED; import java.util.Collection; import java.util.Set; import opennlp.ccg.hylo.graph.LFEdge; import opennlp.ccg.hylo.graph.LFVertex; /** * A filter for edges that tests whether they are aligned based on a specified set of * {@linkplain #getAlignmentIndices() alignment indices}. Whether the source or target vertices * (or both) is considered depends on the match type criteria in effect. For example, if the match * type criteria contains {@link MatchType#SOURCE_ALIGNED}, this filter's {@link #allows(LFEdge)} method * will check whether argument edges have a {@linkplain LFVertex#getIndex() source index} that is * contained in the set of alignment indices. *

* Instances of this class use the following match type criteria: {@link MatchType#SOURCE_ALIGNED}, * {@link MatchType#SOURCE_UNALIGNED}, {@link MatchType#TARGET_ALIGNED}, * and {@link MatchType#TARGET_UNALIGNED}. If the set of alignment indices is modified after an instance * of this class is created, the filter will reflect the changes because the set is not copied at * creation. * * @author Scott Martin */ public class AlignedEdgeFilter extends MatchTypeFilter { Set alignmentIndices; /** * Creates a new aligned edge filter based on the specified alignment indices for the specified * match type criteria. * @param alignmentIndices The set of indices to check for alignment. * @param matchTypes The match type criteria to use. * @throws IllegalArgumentException If alignmentIndices is null. */ public AlignedEdgeFilter(Set alignmentIndices, MatchType... matchTypes) { super(matchTypes); checkAlignmentIndices(alignmentIndices); this.alignmentIndices = alignmentIndices; } /** * Creates a new aligned edge filter based on the specified alignment indices for the specified * match type criteria. * @param alignmentIndices The set of indices to check for alignment. * @param matchTypes The match type criteria to use. * @throws IllegalArgumentException If alignmentIndices is null. */ public AlignedEdgeFilter(Set alignmentIndices, Collection matchTypes) { super(matchTypes); checkAlignmentIndices(alignmentIndices); this.alignmentIndices = alignmentIndices; } private void checkAlignmentIndices(Set alignmentIndices) { if(alignmentIndices == null) { throw new IllegalArgumentException("alignmentIndices is null"); } } /** * Gets the alignment indices used by this filter. */ public Set getAlignmentIndices() { return alignmentIndices; } /** * Sets the alignment indices used by this filter. * @throws IllegalArgumentException If alignmentIndices is null. */ public void setAlignmentIndices(Set alignmentIndices) { checkAlignmentIndices(alignmentIndices); this.alignmentIndices = alignmentIndices; } /** * Tests whether this filter allows the specified LF edge. * @return false if {@link #getMatchTypes()} contains *

     * <ul>
     *   <li>{@link MatchType#SOURCE_ALIGNED}, but the alignment indices do not contain the edge's source vertex's index,</li>
     *   <li>{@link MatchType#SOURCE_UNALIGNED}, but the alignment indices contain the edge's source vertex's index,</li>
     *   <li>{@link MatchType#TARGET_ALIGNED}, but the alignment indices do not contain the edge's target vertex's index,</li>
     *   <li>{@link MatchType#TARGET_UNALIGNED}, but the alignment indices contain the edge's target vertex's index,</li>
     * </ul>
* and true otherwise. * * @see #getAlignmentIndices() * @see LFEdge#getSource() * @see LFEdge#getTarget() * @see LFVertex#getIndex() */ @Override public boolean allows(LFEdge edge) { for(MatchType t : matchTypes) { if(t == SOURCE_ALIGNED && !alignmentIndices.contains(edge.getSource().getIndex())) { return false; } else if(t == SOURCE_UNALIGNED && alignmentIndices.contains(edge.getSource().getIndex())) { return false; } else if(t == TARGET_ALIGNED && !alignmentIndices.contains(edge.getTarget().getIndex())) { return false; } else if(t == TARGET_UNALIGNED && alignmentIndices.contains(edge.getTarget().getIndex())) { return false; } } return true; } } ================================================ FILE: src/opennlp/ccg/disjunctivizer/Disjunctivizer.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.disjunctivizer; import static opennlp.ccg.alignment.PhrasePosition.A; import static opennlp.ccg.alignment.PhrasePosition.B; import static opennlp.ccg.disjunctivizer.Disjunctivizer.VertexType.LOCAL_ANCESTOR; import static opennlp.ccg.disjunctivizer.Disjunctivizer.VertexType.OPTIONAL; import static opennlp.ccg.disjunctivizer.Disjunctivizer.VertexType.PREDICATES; import static opennlp.ccg.disjunctivizer.Disjunctivizer.VertexType.SHARED; import static opennlp.ccg.disjunctivizer.Disjunctivizer.VertexType.VISITED; import static opennlp.ccg.disjunctivizer.MatchType.TARGET_PREDICATE_MISMATCH; import java.util.Arrays; import java.util.Collections; import java.util.EnumMap; import java.util.HashMap; import java.util.HashSet; import java.util.Iterator; import java.util.Map; import java.util.Set; import javax.xml.parsers.DocumentBuilderFactory; import javax.xml.parsers.ParserConfigurationException; import opennlp.ccg.alignment.PhrasePosition; import opennlp.ccg.hylo.Mode; import opennlp.ccg.hylo.Proposition; import opennlp.ccg.hylo.graph.LFEdge; import opennlp.ccg.hylo.graph.LFEdgeLabel; import opennlp.ccg.hylo.graph.LFGraph; import opennlp.ccg.hylo.graph.LFVertex; import opennlp.ccg.util.DelegatedFilter; import opennlp.ccg.util.Filter; import opennlp.ccg.util.FilteredSet; import opennlp.ccg.util.MembershipFilter; import opennlp.ccg.util.VisitedFilter; import org.jgrapht.traverse.DepthFirstIterator; import org.w3c.dom.Document; import org.w3c.dom.Element; import org.w3c.dom.Node; import org.w3c.dom.NodeList; /** * Creates a disjunctive logical form from a difference between two graphs. * Instances can be configured to switch handling of {@link LFGraphDifference#inserts()}, * {@link LFGraphDifference#deletes()} and {@link LFGraphDifference#substitutions()} * on or off. 
By default, all three are performed. *

* Disjunctivizers can be re-used, so that all of the boolean parameters * {@link #setProcessingDeletes(boolean)}, {@link #setProcessingInserts(boolean)}, * and {@link #setProcessingSubstitutions(boolean)} can be modified in between calls to * {@link #buildDisjunctiveLFFor(LFGraphDifference)}. * When these parameters are changed, the disjunctive LF built will change as well. * The {@link Document} used to create disjunctive LF elements (and the elements within them) * can be configured as well, either at creation or via {@link #setDocument(Document)}. * * @author Scott Martin */ public class Disjunctivizer { /** * Attribute set tag name: atts. */ public static final String ATTS_TAG = "atts"; /** * Choice disjunction tag name: one-of. */ public static final String CHOICE_TAG = "one-of"; /** * Disjunctive LF tag name: dlf. */ public static final String DLF_TAG = "dlf"; /** * Node tag name: node. */ public static final String NODE_TAG = "node"; /** * Optional disjunction tag name: opt. */ public static final String OPTIONAL_TAG = "opt"; /** * Relation tag name: rel. */ public static final String RELATION_TAG = "rel"; /** * ID attribute name: id. */ public static final String ID_ATTR = "id"; /** * ID reference attribute name: idref. */ public static final String IDREF_ATTR = "idref"; /** * Name attribute name: name. */ public static final String NAME_ATTR = "name"; /** * Predicate attribute name: pred. */ public static final String PRED_ATTR = "pred"; /** * Attribute name for node sharedness: shared. */ public static final String SHARED_ATTR = "shared"; /** * The suffix appended to foreign nodes: f. */ public static final String FOREIGN_SUFFIX = "f"; Document document; boolean processingInserts, processingDeletes, processingSubstitutions; private Element disjunctiveLF; private LFGraphDifference graphDifference; private Set importedVertices = null; private Map vertexAliases = null; private Map foreignAlignedSubgraphRoots = null; /** * Creates a new disjunctivizer using a new document. * @see #Disjunctivizer(Document) */ public Disjunctivizer() throws ParserConfigurationException { this(DocumentBuilderFactory.newInstance().newDocumentBuilder().newDocument()); } /** * Creates a new disjunctivizer that will use the specified document * to create the elements in its generated disjunctive LFs. * @see #Disjunctivizer(Document, boolean, boolean, boolean) */ public Disjunctivizer(Document document) { this(document, true, true, true); } /** * Creates a new disjunctivizer that will use the specified document * to create the elements in its generated disjunctive LFs, with the specified parameters dictating * whether to process inserts, deletes, and substitutions. * * @param document The document to use for creating elements, attributes, nodes, etc. * @param processingInserts Whether to process {@link LFGraphDifference#inserts()}. * @param processingDeletes Whether to process {@link LFGraphDifference#deletes()}. * @param processingSubstitutions Whether to process {@link LFGraphDifference#substitutions()}. */ public Disjunctivizer(Document document, boolean processingInserts, boolean processingDeletes, boolean processingSubstitutions) { if(document == null) { throw new IllegalArgumentException("document is null"); } this.document = document; this.processingInserts = processingInserts; this.processingDeletes = processingDeletes; this.processingSubstitutions = processingSubstitutions; } /** * Gets the document used to create elements, nodes, attributes, etc. 
* @see #Disjunctivizer(Document, boolean, boolean, boolean) */ public Document getDocument() { return document; } /** * Sets the document used to create elements. * @param document The document that will be used while building disjunctive LF elements. */ public void setDocument(Document document) { this.document = document; } /** * Returns whether this disjunctivizer processes {@link LFGraphDifference#inserts()}. */ public boolean isProcessingInserts() { return processingInserts; } /** * Sets whether this disjunctivizer processes {@link LFGraphDifference#inserts()}. */ public void setProcessingInserts(boolean processingInserts) { if(this.processingInserts != processingInserts) { this.processingInserts = processingInserts; resetDisjunctiveLF(); } } /** * Returns whether this disjunctivizer processes {@link LFGraphDifference#deletes()}. */ public boolean isProcessingDeletes() { return processingDeletes; } /** * Sets whether this disjunctivizer processes {@link LFGraphDifference#deletes()}. */ public void setProcessingDeletes(boolean processingDeletes) { if(this.processingDeletes != processingDeletes) { this.processingDeletes = processingDeletes; resetDisjunctiveLF(); } } /** * Returns whether this disjunctivizer processes {@link LFGraphDifference#substitutions()}. */ public boolean isProcessingSubstitutions() { return processingSubstitutions; } /** * Sets whether this disjunctivizer processes {@link LFGraphDifference#substitutions()}. */ public void setProcessingSubstitutions(boolean processingSubstitutions) { if(this.processingSubstitutions != processingSubstitutions) { this.processingSubstitutions = processingSubstitutions; resetDisjunctiveLF(); } } private void resetDisjunctiveLF() { this.disjunctiveLF = null; } /** * Builds a disjunctive LF based on the specified graph difference. * The shape of the returned element will change depending on whether inserts, deletes, or substitutions * are being processed. * @param graphDifference The graph difference to use for building the disjunctive LF. * @return A recursively build disjunctive LF based on this disjunctivizer's graph difference. * @throws IllegalArgumentException If graphDifference is null. */ public Element buildDisjunctiveLFFor(LFGraphDifference graphDifference) { if(graphDifference == null) { throw new IllegalArgumentException("graph difference is null"); } if(disjunctiveLF == null || !this.graphDifference.equals(graphDifference)) { this.graphDifference = graphDifference; // reset in case this has been previously called if(foreignAlignedSubgraphRoots != null) { foreignAlignedSubgraphRoots = null; } if(importedVertices == null) { importedVertices = new HashSet(); } else { importedVertices.clear(); } if(vertexAliases == null) { vertexAliases = new HashMap(); } else { vertexAliases.clear(); } disjunctiveLF = document.createElement(DLF_TAG); for(LFVertex p : graphDifference.a.highestLFAncestors()) { disjunctiveLF.appendChild(createDisjunctiveElement(new DLFContext(A, p, disjunctiveLF))); } } return disjunctiveLF; } private void findForeignAlignedSubgraphRoots() { foreignAlignedSubgraphRoots = new HashMap(); LFGraphIterator rootIterator = new LFGraphIterator(graphDifference.b); Map> mappings = graphDifference.alignment.asMap(B); while(rootIterator.hasNext()) { LFVertex vertex = rootIterator.next(); if(!foreignAlignedSubgraphRoots.containsKey(vertex)) { // already encountered? if(mappings.containsKey(vertex.getIndex())) { // aligned? 
LFGraphIterator subgraphIterator = new LFGraphIterator(graphDifference.b, vertex); while(subgraphIterator.hasNext()) { // map whole subgraph to the aligned vertex foreignAlignedSubgraphRoots.put(subgraphIterator.next(), vertex); } } } } } private Element createDisjunctiveElement(DLFContext context) { LFVertex alias = vertexAliases.get(context.vertex); String vertexName = nameFor(context.vertex); boolean imported = importedVertices.contains(context.vertex); Element newNode = document.createElement(NODE_TAG); context.parent.appendChild(newNode); DLFContext localContext = context.copy(); localContext.parent = newNode; Set locals = localContext.getVertices(LOCAL_ANCESTOR), visited = localContext.getVertices(VISITED); if(locals.contains(localContext.vertex) || (alias != null && visited.contains(localContext.vertex))) { LFVertex v = (alias == null) ? localContext.vertex : alias; localContext.parent.setAttribute(IDREF_ATTR, nameFor(v)); if(visited.contains(localContext.vertex) && localContext.getVertices(SHARED).contains(v) && !locals.contains(v)) { localContext.parent.setAttribute(SHARED_ATTR, "true"); } } else { localContext.parent.setAttribute(ID_ATTR, alias == null ? vertexName : nameFor(alias)); visited.add(localContext.vertex); locals.add(localContext.vertex); addNonPredAttributes(localContext); if(!imported && processingInserts) { // inserts processInserts(localContext); } if(!imported && processingDeletes) { // deletes processDeletes(localContext); } LFGraph graph = localContext.getGraph(); @SuppressWarnings("unchecked") Set outgoingEdges = graph.containsVertex(localContext.vertex) ? graph.outgoingEdgesOf(localContext.vertex) : Collections.EMPTY_SET; if(outgoingEdges.isEmpty()) { // leaf? setPredicateName(localContext); } else { if(!imported && processingSubstitutions) { // do substitutions, if applicable processSubstitutions(localContext); } else { for(LFEdge out : outgoingEdges) { if(imported) { importedVertices.add(out.getTarget()); } // context.graph should be the B graph if imported processNonsubstitutedEdge(localContext, out); } } } } fixLabelReferences(newNode); return newNode; } private String nameFor(LFVertex vertex) { String vn = vertex.getName(); return importedVertices.contains(vertex) ? 
vn + FOREIGN_SUFFIX : vn; } private void processInserts(DLFContext context) { Element optional = null; for(LFEdge ins : graphDifference.insertsFor(context.vertex)) { // check if subgraph is aligned somewhere if(foreignAlignedSubgraphRoots == null) { findForeignAlignedSubgraphRoots(); } if(!foreignAlignedSubgraphRoots.containsKey(ins.getTarget())) { DLFContext ctxt = context.copy(); ctxt.graphPosition = B; // use foreign graph if(optional == null) { ctxt.parent = addOptional(context); } importedVertices.add(ins.getTarget()); // remember that inserted vertex is foreign doInsertDelete(ctxt, ins); } } } private void processDeletes(DLFContext context) { Element optional = null; for(LFEdge del : graphDifference.deletesFor(context.vertex)) { DLFContext ctxt = context.copy(); if(optional == null) { ctxt.parent = addOptional(context); } doInsertDelete(ctxt.copy(), del); } } private void doInsertDelete(DLFContext context, LFEdge edge) { LFVertex trg = edge.getTarget(); DLFContext ctxt = context.copy(); ctxt.vertex = trg; ctxt.parent = addRelation(ctxt, edge.getLabel()); ctxt.addVertex(trg, OPTIONAL); ctxt.parent.appendChild(createDisjunctiveElement(ctxt)); } private void processSubstitutions(DLFContext context) { for(LFEdge outgoing : context.getGraph().outgoingEdgesOf(context.vertex)) { if(graphDifference.substitutionsFor(outgoing).isEmpty()) { // no substitution(s) for this edge? processNonsubstitutedEdge(context.copy(), outgoing); } else { processSubstitutedEdge(context.copy(), outgoing); } } } private void processNonsubstitutedEdge(DLFContext context, LFEdge outgoing) { if(!context.getVertices(PREDICATES).contains(context.vertex)) { setPredicateName(context); } LFVertex trg = outgoing.getTarget(); Set similarTargets = new FilteredSet(context.getVertices(OPTIONAL), new SimilarTargetVertexFilter(trg)); if(similarTargets.isEmpty()) { DLFContext ctxt = context.copy(); ctxt.vertex = trg; ctxt.parent = addRelation(context, outgoing.getLabel()); ctxt.parent.appendChild(createDisjunctiveElement(ctxt)); } else { // target already present as an option for(LFVertex similar : similarTargets) { assimilateAttributes(context.copy(), trg, similar); } } } private void processSubstitutedEdge(DLFContext context, LFEdge outgoing) { processSubstitutedSimilarTarget(context.copy(), outgoing); if(!context.getVertices(PREDICATES).contains(context.vertex)) { processSubstitutedPredicates(context.copy(), outgoing); } // get the substitutions for the outgoing edge Map> subsBySource = graphDifference.substitutionsBySourceFor(outgoing); EdgeMatchFilter predicateFilter = null; for(LFVertex subSource : subsBySource.keySet()) { Set subEdges = subsBySource.get(subSource); if(predicateFilter == null) { predicateFilter = new EdgeMatchFilter(outgoing, TARGET_PREDICATE_MISMATCH); } else { predicateFilter.setBasis(outgoing); } // find the edges matching the outgoing edge's label, and the vertices with different predicates // from the outgoing edge's target vertex FilteredLFEdgeSet identicals = new FilteredLFEdgeSet(subEdges, new MembershipFilter( context.getGraph().outgoingEdgesOf(context.vertex))); Set matchingLabels = new FilteredLFEdgeSet(subEdges, new LabelMatchFilter(outgoing.getLabel())); Set differentPredicates = new FilteredSet( new FilteredLFEdgeSet(matchingLabels, predicateFilter).targetView(), new VisitedFilter()); // deal with the edges with matching labels separately from other substitutions subEdges.removeAll(matchingLabels); differentPredicates.removeAll(identicals.targetView()); subEdges.removeAll(identicals); 
if(subEdges.isEmpty() && differentPredicates.isEmpty()) { // no substitutions to make DLFContext ctxt = context.copyWithVertexMask(LOCAL_ANCESTOR, PREDICATES); fixOptions(ctxt, outgoing.getLabel()); ctxt.parent = addRelation(context, outgoing.getLabel()); ctxt.vertex = outgoing.getTarget(); ctxt.parent.appendChild(createDisjunctiveElement(ctxt)); } else { if(!differentPredicates.isEmpty()) { // handle matching labels but different predicates processDifferentPredicates(context.copy(), outgoing, differentPredicates); } if(!subEdges.isEmpty()) { // handle others processSubstitutedEdges(context.copy(), outgoing, subEdges); } } } } private void processDifferentPredicates(DLFContext context, LFEdge outgoing, Set differentPredicates) { LFEdgeLabel label = outgoing.getLabel(); boolean terminal = context.getGraph().outDegreeOf(context.vertex) == 0; if(!terminal) { terminal = !new FilteredSet( differentPredicates, new TerminalFilter(graphDifference.b)) .isEmpty(); } if(terminal) { DLFContext ctxt = context.copy(); ctxt.vertex = outgoing.getTarget(); if(differentPredicates.size() == 1) { // if we're here at all, it's at least non-empty processSingletonDifferentPredicate(ctxt, outgoing, differentPredicates.iterator().next()); } else { processMultipleDifferentPredicates(ctxt, outgoing, differentPredicates); } } else { // non-terminal, continue recursing through the graph DLFContext ctxt = context.copyWithVertexMask(LOCAL_ANCESTOR, PREDICATES); ctxt.vertex = outgoing.getTarget(); ctxt.parent = addRelation(ctxt, label); ctxt.parent.appendChild(createDisjunctiveElement(ctxt)); } } private void processSingletonDifferentPredicate(DLFContext context, LFEdge outgoing, LFVertex differentPredicate) { LFEdgeLabel label = outgoing.getLabel(); // add relation, then choice point Element newRel = addRelation(context, label); context.parent = newRel; Element choiceElement = addChoice(context); context.parent = choiceElement; // generate the target element, but do not propagate changes to tracked vertices Element targetElement = createDisjunctiveElement(context.copy(true)); if(!vertexAliases.containsKey(differentPredicate)) { vertexAliases.put(differentPredicate, outgoing.getTarget()); } context.vertex = differentPredicate; context.parent.appendChild(createDisjunctiveElement(context.copy(true))); // cleanup: how many new nodes were aliased? 
NodeList newNodes = newRel.getElementsByTagName(NODE_TAG); for(int j = 0; j < newNodes.getLength(); j++) { if(newNodes.item(j).getAttributes().getNamedItem(IDREF_ATTR) == null) { return; // one wasn't aliased } } // if we get here, they all were aliased: use generated target element instead newRel.replaceChild(targetElement, choiceElement); } private void processMultipleDifferentPredicates(DLFContext context, LFEdge outgoing, Set differentPredicates) { LFEdgeLabel label = outgoing.getLabel(); // generate the choice point Element choiceElement = addChoice(context); context.parent = choiceElement; // and the relation, but do not propagate changes to tracked vertices context.parent = addRelation(context, label); context.parent.appendChild(createDisjunctiveElement(context.copy(true))); // add attributes tag, after resetting parent to choice point context.parent = choiceElement; Element atts = addElement(context, ATTS_TAG); // then go through the different predicates, checking for aliases boolean aliased = false; for(LFVertex d : differentPredicates) { context.parent = atts; if(!aliased && !vertexAliases.containsKey(d)) { vertexAliases.put(d, outgoing.getTarget()); aliased = true; } // add new relation for each different pred. context.parent = addRelation(context, label); context.vertex = d; context.parent.appendChild(createDisjunctiveElement(context.copy(true))); } } private void processSubstitutedEdges(DLFContext context, LFEdge outgoing, Set substituedEdges) { LFEdgeLabel label = outgoing.getLabel(); boolean singleton = substituedEdges.size() == 1; // can't be empty if we get here Element choiceElement = addChoice(context); context.parent = choiceElement; Element toAppendTo = singleton ? choiceElement : addElement(context, ATTS_TAG); context.parent = addRelation(context, label); DLFContext ctxt = context.copy(true); ctxt.vertex = outgoing.getTarget(); ctxt.parent.appendChild(createDisjunctiveElement(ctxt)); boolean aliased = false; context.parent = toAppendTo; for(LFEdge s : substituedEdges) { LFVertex t = s.getTarget(); String vPred = context.vertex.getPredicate(), tPred = t.getPredicate(); LFEdgeLabel l = s.getLabel(); context.parent = addRelation(context, l); // shared? if(vPred != null && vPred.equals(tPred) && !label.equals(l)) { Element subNode = addElement(context, NODE_TAG); subNode.setAttribute(IDREF_ATTR, nameFor(context.vertex)); LFVertex sAlias = vertexAliases.get(context.vertex); if(context.getVertices(VISITED).contains(sAlias) && context.getVertices(SHARED).contains(sAlias) && !context.getVertices(LOCAL_ANCESTOR).contains(sAlias)) { subNode.setAttribute(SHARED_ATTR, "true"); } } else { if((singleton || !aliased) && !vertexAliases.containsKey(t)) { vertexAliases.put(t, outgoing.getTarget()); aliased = true; } DLFContext c = context.copy(true); c.vertex = t; importedVertices.add(t); c.graphPosition = B; // use foreign graph for substitution c.parent.appendChild(createDisjunctiveElement(c)); } } } private void processSubstitutedSimilarTarget(DLFContext context, LFEdge outgoing) { LFVertex target = outgoing.getTarget(); Map> subsBySource = graphDifference.substitutionsBySourceFor(outgoing); DLFContext ctxt = context.copy(); // for each substituted edge, look for similar target for(LFVertex subSource : subsBySource.keySet()) { Set similarTargetEdges = new FilteredLFEdgeSet(subsBySource.get(subSource), new SimilarTargetEdgeFilter(ctxt.vertex, outgoing.getLabel())); if(!similarTargetEdges.isEmpty()) { if(similarTargetEdges.size() > 1) { // more than one similar target? 
System.err.println("more than one similar target edge for " + ctxt.vertex + ": " + similarTargetEdges); // TODO figure out what to do about this } assimilateAttributes(ctxt, target, similarTargetEdges.iterator().next().getTarget()); LFVertex hp = ctxt.getGraph().highestLFAncestorOf(target); if(hp == null || hp.equals(outgoing.getSource())) { context.getVertices(SHARED).add(target); ctxt.vertex = target; ctxt.vertices = context.copyVertices(LOCAL_ANCESTOR, PREDICATES); ctxt.parent.appendChild(createDisjunctiveElement(ctxt)); return; // stop after similar target found } } } } private void processSubstitutedPredicates(DLFContext context, LFEdge outgoing) { final String predicate = context.vertex.getPredicate(); if(predicate != null) { Set alternates = new FilteredSet( graphDifference.substitutionsBySourceFor(outgoing).keySet(), new DelegatedFilter(new Filter(){ @Override public boolean allows(String s) { return !predicate.equals(s); } }) { @Override public String delegateValueFor(LFVertex e) { return e.getPredicate(); } }); if(alternates.isEmpty()) { // the simple case, no other predicates involved setPredicateName(context); } else { // add alternates as choice, with predicate an option DLFContext ctxt = context.copy(); ctxt.getVertices(PREDICATES).add(ctxt.vertex); ctxt.parent = addChoice(ctxt); addAttributes(ctxt, PRED_ATTR, predicate); for(LFVertex ap : alternates) { addAttributes(ctxt, PRED_ATTR, ap.getPredicate()); } } } } private Element addRelation(DLFContext context, LFEdgeLabel label) { Element newRel = addElement(context, RELATION_TAG); newRel.setAttribute(NAME_ATTR, label.getName()); return newRel; } private Element addOptional(DLFContext context) { return addElement(context, OPTIONAL_TAG); } private Element addChoice(DLFContext context) { return addElement(context, CHOICE_TAG); } private Element addElement(DLFContext context, String elementName) { Element newEl = document.createElement(elementName); context.parent.appendChild(newEl); return newEl; } private Element addAttributes(DLFContext context, String name, String value) { Element newAtts = document.createElement(ATTS_TAG); context.parent.appendChild(newAtts); newAtts.setAttribute(name, value); return newAtts; } private Element addAttributes(DLFContext context, Map attributes) { Element newAtts = document.createElement(ATTS_TAG); context.parent.appendChild(newAtts); for(Mode m : attributes.keySet()) { String n = m.getName(); if(!n.equals(PRED_ATTR)) { // TODO does this ever happen? 
newAtts.setAttribute(n, attributes.get(m).getName()); } } return newAtts; } private void fixLabelReferences(Element newNode) { NodeList rels = newNode.getChildNodes(); int rlen = rels.getLength(); Map refRels = new HashMap(rlen); for(int k = 0; k < rlen; k++) { Node n = rels.item(k); if(n != null && n.getNodeType() == Node.ELEMENT_NODE && n.getNodeName().equals(RELATION_TAG)) { Element ne = (Element)n; Node m = ne.getFirstChild(); if(m != null && m.getNodeType() == Node.ELEMENT_NODE && m.getNodeName().equals(NODE_TAG)) { Element me = (Element)m; String l = ne.getAttribute(NAME_ATTR); String idref = me.getAttribute(IDREF_ATTR); if(idref == null || idref.length() == 0) { String id = me.getAttribute(ID_ATTR); if(id != null && id.length() > 0) { refRels.put(l, id); } } else { if(idref.equals(refRels.get(l))) { newNode.removeChild(n); } else { refRels.put(l, idref); } } } } } } private void fixOptions(DLFContext context, LFEdgeLabel label) { String cPred = context.vertex.getPredicate(); if(cPred == null) { return; } NodeList ncs = context.parent.getChildNodes(); for(int j = 0; j < ncs.getLength(); j++) { Node c = ncs.item(j); if(c != null && c.getNodeType() == Node.ELEMENT_NODE && c.getNodeName().equals(OPTIONAL_TAG)) { NodeList rs = c.getChildNodes(); for(int k = 0; k < rs.getLength(); k++) { Node r = rs.item(k); if(r != null && r.getNodeType() == Node.ELEMENT_NODE && r.getNodeName().equals(RELATION_TAG)) { Element re = (Element)r; if(label.getName().equals(re.getAttribute(NAME_ATTR))) { Node d = re.getFirstChild(); if(d != null && d.getNodeType() == Node.ELEMENT_NODE && d.getNodeName().equals(NODE_TAG) && cPred.equals(((Element)d).getAttribute(PRED_ATTR))) { context.parent.removeChild(c); break; // don't try to remove more than once, throws DOMException } } } } } } } private void setPredicateName(DLFContext context) { String p = context.vertex.getPredicate(); if(p != null) { context.parent.setAttribute(PRED_ATTR, p); context.getVertices(PREDICATES).add(context.vertex); } } private void addNonPredAttributes(DLFContext context) { for(Mode m : context.vertex.attributeNames()) { String n = m.getName(); if(!n.equals(PRED_ATTR)) { // TODO is this attribute ever present?? 
context.parent.setAttribute(n, context.vertex.getAttributeValue(m).getName()); } } } private void assimilateAttributes(DLFContext context, LFVertex one, LFVertex two) { // copy attribute maps for both vertices Map oneAttrs = new HashMap(one.getAttributeMap()), twoAttrs = new HashMap(two.getAttributeMap()); // add all attributes common to both vertices, remove from both maps Iterator> i = oneAttrs.entrySet().iterator(); while(i.hasNext()) { Map.Entry e = i.next(); Set> tes = twoAttrs.entrySet(); if(tes.contains(e)) { context.parent.setAttribute(e.getKey().getName(), e.getValue().getName()); i.remove(); tes.remove(e); } } if(oneAttrs.isEmpty()) { // if first is empty, add second as optional if(!twoAttrs.isEmpty()) { DLFContext ctxt = context.copy(true); ctxt.parent = addOptional(context); addAttributes(ctxt, twoAttrs); } } else if(twoAttrs.isEmpty()) { // some attributes remain for first vertex addAttributes(context.copy(), oneAttrs); } else { // both are non-empty, make choice DLFContext ctxt = context.copy(true); ctxt.parent = addChoice(context); addAttributes(ctxt, oneAttrs); addAttributes(ctxt, twoAttrs); } } static class SimilarTargetVertexFilter implements Filter { LFVertex vertex; SimilarTargetVertexFilter(LFVertex vertex) { this.vertex = vertex; } @Override public boolean allows(LFVertex v) { String p = vertex.getPredicate(); return p != null && p.equals(v.getPredicate()); } } static class SimilarTargetEdgeFilter extends DelegatedFilter { LFEdgeLabel label; SimilarTargetEdgeFilter(LFVertex vertex, LFEdgeLabel label) { super(new SimilarTargetVertexFilter(vertex)); this.label = label; } @Override public boolean allows(LFEdge e) { return super.allows(e) && label.equals(e.getLabel()); } @Override public LFVertex delegateValueFor(LFEdge e) { return e.getTarget(); } } class TerminalFilter implements Filter { LFGraph graph; TerminalFilter(LFGraph graph) { this.graph = graph; } @Override public boolean allows(LFVertex e) { return graph.outDegreeOf(e) == 0; } } static enum VertexType { LOCAL_ANCESTOR, OPTIONAL, PREDICATES, SHARED, VISITED; } class DLFContext { PhrasePosition graphPosition; LFVertex vertex; Element parent; private Map> vertices; DLFContext(PhrasePosition graphPosition, LFVertex vertex, Element parent) { this(graphPosition, vertex, parent, new EnumMap>(VertexType.class)); } DLFContext(PhrasePosition graphPosition, LFVertex vertex, Element parent, Map> vertices) { this.graphPosition = graphPosition; this.vertex = vertex; this.parent = parent; this.vertices = vertices; } LFGraph getGraph() { return graphDifference.get(graphPosition); } DLFContext copy() { return copy(false); } DLFContext copy(boolean copyVertices) { return copyVertices ? copyWithVertexMask(VertexType.values()) : new DLFContext(graphPosition, vertex, parent, vertices); } DLFContext copyWithVertexMask(VertexType... vertexType) { return new DLFContext(graphPosition, vertex, parent, copyVertices(vertexType)); } Map> copyVertices() { return copyVertices(VertexType.values()); } Map> copyVertices(VertexType... 
vertexType) { Map> m = new EnumMap>(vertices); m.keySet().retainAll(Arrays.asList(vertexType)); return m; } Set getVertices(VertexType vertexType) { Set vs = vertices.get(vertexType); if(vs == null) { vs = new HashSet(); vertices.put(vertexType, vs); } return vs; } boolean addVertex(LFVertex vertex, VertexType vertexType) { return getVertices(vertexType).add(vertex); } } static class LFGraphIterator extends DepthFirstIterator { LFGraphIterator(LFGraph graph) { super(graph); } LFGraphIterator(LFGraph graph, LFVertex startVertex) { super(graph, startVertex); } } } ================================================ FILE: src/opennlp/ccg/disjunctivizer/EdgeMatchFilter.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.disjunctivizer; import static opennlp.ccg.disjunctivizer.MatchType.LABEL_MATCH; import static opennlp.ccg.disjunctivizer.MatchType.LABEL_MISMATCH; import static opennlp.ccg.disjunctivizer.MatchType.SOURCE_MATCH; import static opennlp.ccg.disjunctivizer.MatchType.SOURCE_MISMATCH; import static opennlp.ccg.disjunctivizer.MatchType.SOURCE_PREDICATE_MATCH; import static opennlp.ccg.disjunctivizer.MatchType.SOURCE_PREDICATE_MISMATCH; import static opennlp.ccg.disjunctivizer.MatchType.TARGET_MATCH; import static opennlp.ccg.disjunctivizer.MatchType.TARGET_MISMATCH; import static opennlp.ccg.disjunctivizer.MatchType.TARGET_PREDICATE_MATCH; import static opennlp.ccg.disjunctivizer.MatchType.TARGET_PREDICATE_MISMATCH; import java.util.Arrays; import java.util.Collection; import java.util.EnumSet; import opennlp.ccg.hylo.graph.LFEdge; import opennlp.ccg.util.CompositeFilter; import opennlp.ccg.util.Filter; import opennlp.ccg.util.InverseFilter; /** * A filter for LF edges based on a set of {@linkplain #getMatchTypes() match type criteria}. Instances of * this class compare a specified {@linkplain #getBasis() basis edge} based on their match type criteria. * This class extends {@link CompositeFilter}, and the constructors add various filters as members depending on * the criteria in effect. *

* Edge match filters use the following match types as criteria in addition to the ones used by * {@link VertexMatchFilter}: {@link MatchType#LABEL_MATCH}, and {@link MatchType#LABEL_MISMATCH}. * * @see VertexMatchFilter * @see LabelMatchFilter * * @author Scott Martin */ public class EdgeMatchFilter extends CompositeFilter { LFEdge basis; final EnumSet matchTypes; /** * Creates a new edge match filter based on the specified edge and criteria. * @see #EdgeMatchFilter(LFEdge, Collection) */ public EdgeMatchFilter(LFEdge basis, MatchType... matchTypes) { this(basis, Arrays.asList(matchTypes)); } /** * Creates a new edge match filter based on the specified edge, using the specified * match type criteria. Depending on the criteria, this constructor adds instances of * {@link VertexMatchFilter} and {@link LabelMatchFilter} (or their inverses) to the * set of filters composing it. * * @param basis The LF edge to use for comparison. * @param matchTypes The comparison criteria, used to populate this composite filter. * * @throws IllegalArgumentException if basis is null. */ public EdgeMatchFilter(LFEdge basis, Collection matchTypes) { super(); checkBasis(basis); this.basis = basis; this.matchTypes = EnumSet.copyOf(matchTypes); for(MatchType t : matchTypes) { Filter f = null; if(t == LABEL_MATCH || t == LABEL_MISMATCH) { f = new LabelMatchFilter(basis.getLabel()); if(t == LABEL_MISMATCH) { f = new InverseFilter(f); } } else if(t == SOURCE_MATCH || t == SOURCE_MISMATCH || t == SOURCE_PREDICATE_MATCH || t == SOURCE_PREDICATE_MISMATCH) { f = new VertexMatchFilter(basis.getSource(), t); } else if(t == TARGET_MATCH || t == TARGET_MISMATCH || t == TARGET_PREDICATE_MATCH || t == TARGET_PREDICATE_MISMATCH) { f = new VertexMatchFilter(basis.getTarget(), t); } if(f != null) { addFilter(f); } } } private void checkBasis(LFEdge basis) { if(basis == null) { throw new IllegalArgumentException("basis is null"); } } /** * Gets the edge that comparisons are based on. */ public LFEdge getBasis() { return basis; } /** * Sets the edge used for comparisons. * @throws IllegalArgumentException if basis is null. */ public void setBasis(LFEdge basis) { checkBasis(basis); this.basis = basis; } /** * Gets the match type criteria used by this edge match filter. */ public EnumSet getMatchTypes() { return matchTypes; } } ================================================ FILE: src/opennlp/ccg/disjunctivizer/FilteredLFEdgeSet.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.disjunctivizer; import java.util.AbstractCollection; import java.util.Collection; import java.util.Iterator; import java.util.Set; import opennlp.ccg.hylo.graph.LFEdge; import opennlp.ccg.hylo.graph.LFEdgeLabel; import opennlp.ccg.hylo.graph.LFVertex; import opennlp.ccg.util.Filter; import opennlp.ccg.util.FilteredSet; /** * A filtered set of LF edges. This class extends {@link FilteredSet} to provide the additional functionality * of edge-based views of its contents: {@link #sourceView()}, {@link #targetView()}, and {@link #labelView()}, * which respectively get the set of source vertices, set of target vertices, and set of labels contained * in the edges in this set. All of these view sets are read-only, so that attempting to add or remove * elements from them (including via the iterator) throws {@link UnsupportedOperationException}. * * @author Scott Martin */ public class FilteredLFEdgeSet extends FilteredSet { private VertexView sourceView = null, targetView = null; private LabelView labelView = null; /** * Creates a new filtered edge set based on the specified underlying edge set and edge filter. */ public FilteredLFEdgeSet(Set edges, Filter edgeFilter) { super(edges, edgeFilter); } /** * Gets a view of this filtered edge set as a set of LF vertices that are the * {@linkplain LFEdge#getSource() source vertices} for each edge in this set. * @return A set containing every LF vertex that is the source vertex of some edge in this set. * Note that the returned collection is immutable, and may contain duplicate vertices. */ public Collection sourceView() { return (sourceView == null) ? (sourceView = new VertexView(true)) : sourceView; } /** * Gets a view of this filtered edge set as a set of LF vertices that are the * {@linkplain LFEdge#getTarget() target vertices} for each edge in this set. * @return A set containing every LF vertex that is the target vertex of some edge in this set. * Note that the returned collection is immutable, and may contain duplicate vertices. */ public Collection targetView() { return (targetView == null) ? (targetView = new VertexView(false)) : targetView; } /** * Gets a view of this filtered edge set as a set of LF vertices that are the * {@linkplain LFEdge#getLabel() labels} for each edge in this set. * @return A set containing every LF edge label that is the label of some edge in this set. * Note that the returned collection is immutable, and may contain duplicate labels. */ public Collection labelView() { return (labelView == null) ? (labelView = new LabelView()) : labelView; } abstract class ComponentView extends AbstractCollection { abstract T componentOf(LFEdge edge); @Override public Iterator iterator() { return new Iterator() { private Iterator i = FilteredLFEdgeSet.this.iterator(); @Override public boolean hasNext() { return i.hasNext(); } @Override public T next() { // don't have to worry whether hasNext() is true, iterator should throw exception if not return componentOf(i.next()); } @Override public void remove() { throw new UnsupportedOperationException(); } }; } @Override public int size() { return FilteredLFEdgeSet.this.size(); } } class VertexView extends ComponentView { boolean source; VertexView(boolean source) { this.source = source; } @Override LFVertex componentOf(LFEdge edge) { return source ? 
edge.getSource() : edge.getTarget(); } } class LabelView extends ComponentView { @Override LFEdgeLabel componentOf(LFEdge edge) { return edge.getLabel(); } } } ================================================ FILE: src/opennlp/ccg/disjunctivizer/LFGraphDifference.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.disjunctivizer; import static opennlp.ccg.alignment.PhrasePosition.A; import static opennlp.ccg.alignment.PhrasePosition.B; import static opennlp.ccg.disjunctivizer.MatchType.SOURCE_ALIGNED; import static opennlp.ccg.disjunctivizer.MatchType.SOURCE_MATCH; import static opennlp.ccg.disjunctivizer.MatchType.SOURCE_UNALIGNED; import static opennlp.ccg.disjunctivizer.MatchType.TARGET_ALIGNED; import static opennlp.ccg.disjunctivizer.MatchType.TARGET_UNALIGNED; import java.util.AbstractMap; import java.util.AbstractSet; import java.util.Collections; import java.util.Iterator; import java.util.LinkedHashSet; import java.util.Map; import java.util.Set; import java.util.Map.Entry; import opennlp.ccg.alignment.Alignment; import opennlp.ccg.alignment.PhrasePosition; import opennlp.ccg.hylo.graph.LFEdge; import opennlp.ccg.hylo.graph.LFGraph; import opennlp.ccg.hylo.graph.LFVertex; import opennlp.ccg.util.CompositeFilter; import opennlp.ccg.util.Filter; import opennlp.ccg.util.FilteredMap; import opennlp.ccg.util.FilteredSet; import opennlp.ccg.util.VisitedFilter; /** * Represents the difference between two {@link LFGraph}s that characterizes their difference as a set * of edits: either {@link #inserts()}, {@link #deletes()}, or {@link #substitutions()}. These edits are * determined by a specified {@linkplain #getAlignment() alignment} between the phrases the graphs * are supposed to represent. All of the sets of edges returned by this class, and the convenience maps * build on top of them, are read-only. Attempting to add or remove elements or keys from any of these * (including via any of the iterators) throws an {@link UnsupportedOperationException}. *

* This class also provides the convenience methods {@link #insertsFor(LFVertex)} and * {@link #deletesFor(LFVertex)}, for getting just the inserts or deletes for a specified vertex. * The convenience methods {@link #substitutionsFor(LFEdge)} gets the set of substitutions correspoding * to a given edge, and {@link #substitutionsBySource()} and {@link #substitutionsBySourceFor(LFEdge)} * are similar methods that provide maps whose keys are the source vertices of the substituted edges. * * @author Scott Martin */ public class LFGraphDifference { final LFGraph a, b; final Alignment alignment; private Set deletes, inserts, substitutions; /** * Creates a new graph difference between a and b, as determined by the specified * alignment. * @param a The {@linkplain PhrasePosition#A A-position} graph. * @param b The {@linkplain PhrasePosition#B B-position} graph. * @param alignment An alignment between a and b where the * {@linkplain PhrasePosition#A A-position} indices are understood to correspond to a and * {@linkplain PhrasePosition#B B-position} indices are understood to correspond to b. * @throws IllegalArgumentException If either graph is null, or if the alignment is * null. */ public LFGraphDifference(LFGraph a, LFGraph b, Alignment alignment) { checkGraph(a, A); checkGraph(b, B); if(alignment == null) { throw new IllegalArgumentException("alignment is null"); } this.a = a; this.b = b; this.alignment = alignment; } private void checkGraph(LFGraph g, PhrasePosition pos) { if(g == null) { throw new IllegalArgumentException(pos.name() + " graph is null"); } } /** * Gets the {@linkplain PhrasePosition#A A-position} graph. */ public LFGraph getA() { return get(A); } /** * Gets the {@linkplain PhrasePosition#B B-position} graph. */ public LFGraph getB() { return get(B); } /** * Gets the graph in the specified position. * @param position The position to retrieve a graph for. * @return The value of {@link #getA()} if position is {@link PhrasePosition#A}, and * the value of {@link #getB()} otherwise. */ public LFGraph get(PhrasePosition position) { return (position == A) ? a : b; } /** * Gets the alignment used to determine the edits between the two graphs. */ public Alignment getAlignment() { return alignment; } /** * Computes a hash code for this graph difference based on its graphs and the * alignment between them. */ @Override public int hashCode() { return 31 * a.hashCode() + b.hashCode() + alignment.hashCode(); } /** * Tests whether this LF graph difference is equivalent to another by comparing their * graphs and the alignment between them. */ @Override public boolean equals(Object obj) { if(obj instanceof LFGraphDifference) { LFGraphDifference diff = (LFGraphDifference)obj; return a.equals(diff.a) && b.equals(diff.b) && alignment.equals(diff.alignment); } return false; } /** * Gets a string representation of this graph difference. */ @Override public String toString() { StringBuilder sb = new StringBuilder("difference for graphs: "); for(PhrasePosition pos : PhrasePosition.values()) { sb.append(pos); sb.append(": "); sb.append(get(pos)); sb.append(", "); } sb.append("alignment: "); sb.append(alignment.toString()); return sb.toString(); } /** * Gets an LF graph difference that is the reverse of the present one. 
* @return An LF graph difference whose {@linkplain PhrasePosition#A A-position} graph is the value of this * difference's {@link #getB()}, whose {@linkplain PhrasePosition#B B-position} graph is the value of this * difference's {@link #getA()}, and whose alignments are the {@linkplain Alignment#reverse() reverse} of * this difference's {@link #getAlignment()}. */ public LFGraphDifference reverse() { return new LFGraphDifference(b, a, alignment.reverse()); } /** * Gets the deletes for this graph difference. * @return The set of edges in the {@linkplain PhrasePosition#A A-position} graph that have an aligned * {@linkplain LFEdge#getSource() source vertex} and an unaligned * {@linkplain LFEdge#getTarget() target vertex}. * * @see AlignedEdgeFilter */ public Set deletes() { return (deletes == null) ? (deletes = doDeletes(A)) : deletes; } /** * Gets the inserts for this graph difference. * @return The set of edges in the {@linkplain PhrasePosition#B B-position} graph that have an aligned * {@linkplain LFEdge#getSource() source vertex} and an unaligned * {@linkplain LFEdge#getTarget() target vertex}. * * @see AlignedEdgeFilter */ public Set inserts() { return (inserts == null) ? (inserts = doDeletes(B)) : inserts; } Set doDeletes(PhrasePosition keyPosition) { return Collections.unmodifiableSet(new FilteredLFEdgeSet(get(keyPosition).edgeSet(), new AlignedEdgeFilter(alignment.asMap(keyPosition).keySet(), SOURCE_ALIGNED, TARGET_UNALIGNED))); } /** * Gets the inserts for a specified vertex. * @param vertex The vertex to return the inserts for. * @return The subset of {@link #inserts()} whose {@linkplain LFEdge#getSource() source} index is among the * {@linkplain Alignment#getTargets(Integer) targets} for the specified vertex, or {@link Collections#EMPTY_SET} * if none exist. * * @see AlignedEdgeFilter */ @SuppressWarnings("unchecked") public Set insertsFor(LFVertex vertex) { Set indices = alignment.getTargets(vertex.getIndex()); return (indices.isEmpty()) ? Collections.EMPTY_SET : new FilteredLFEdgeSet(inserts(), new AlignedEdgeFilter(indices, SOURCE_ALIGNED)); } /** * Gets the deletes for a specified vertex. * @param vertex The vertex to get the deletes for. * @return The subset of {@link #deletes()} whose {@linkplain LFEdge#getSource() source vertex} is * the specified vertex. * * @see VertexMatchFilter */ public Set deletesFor(LFVertex vertex) { return new FilteredLFEdgeSet(deletes(), new VertexMatchFilter(vertex, SOURCE_MATCH)); } /** * Gets the substitutions for this graph difference. * @return The subset of the {@linkplain PhrasePosition#B B-position} graph's edges for which there * exists an edge in the {@linkplain PhrasePosition#A A-position} graph that meets the following * conditions: *

 *   1. The B edge's source is aligned to the A edge's source, but the B edge's target is not.
 *   2. The B edge's target is aligned to the A edge's target, but the B edge's source is not.
* * @see CompositeFilter */ public Set substitutions() { if(substitutions == null) { substitutions = new LinkedHashSet(); Set bEdges = b.edgeSet(); AlignedEdgeFilter sourceFilter = null, targetFilter = null; CompositeFilter filter = new CompositeFilter(); for(LFEdge aEdge : a.edgeSet()) { Set sMaps = alignment.getTargets(aEdge.getSource().getIndex()), tMaps = alignment.getTargets(aEdge.getTarget().getIndex()); if(!sMaps.isEmpty() && !tMaps.isEmpty()) { if(sourceFilter == null) { sourceFilter = new AlignedEdgeFilter(sMaps, SOURCE_ALIGNED, TARGET_UNALIGNED); targetFilter = new AlignedEdgeFilter(tMaps, TARGET_ALIGNED, SOURCE_UNALIGNED); filter.addFilter(sourceFilter); filter.addFilter(targetFilter); } else { sourceFilter.setAlignmentIndices(sMaps); targetFilter.setAlignmentIndices(tMaps); } substitutions.addAll(new FilteredLFEdgeSet(bEdges, filter)); } } } return Collections.unmodifiableSet(substitutions); } /** * Gets the substitutions for the specified edge. * @param edge The edge to get substitutions for. * @return The subset of {@link #substitutions()} whose source is aligned to the edge's source and * whose target is aligned to the edge's target, or {@link Collections#EMPTY_SET} if none exist. */ @SuppressWarnings("unchecked") public Set substitutionsFor(LFEdge edge) { Set srcMapsTo = alignment.getTargets(edge.getSource().getIndex()), trgMapsTo = alignment.getTargets(edge.getTarget().getIndex()); return (srcMapsTo.isEmpty() || trgMapsTo.isEmpty()) ? Collections.EMPTY_SET : Collections.unmodifiableSet(new FilteredLFEdgeSet(substitutions(), new CompositeFilter(new AlignedEdgeFilter(srcMapsTo, SOURCE_ALIGNED), new AlignedEdgeFilter(trgMapsTo, TARGET_ALIGNED)))); } /** * Gets a map view of the substitutions in this graph difference. * @return A map whose keys are the source vertices in the set of {@link #substitutions()} and whose values * are the edges whose {@linkplain LFEdge#getSource() source vertex} is the same as the corresponding key. * If there are no substitutions, {@link Collections#EMPTY_MAP} is returned. *

* Note that the returned map is * read-only, that is, both its {@link Map#put(Object, Object)} method and its * {@linkplain Map#entrySet() entry set}'s iterator's {@link Iterator#remove()} method throw an * {@link UnsupportedOperationException}. Also, the members of the returned map's entry set are immutable, * so that their {@link Entry#setValue(Object)} methods also throw an {@link UnsupportedOperationException}. */ @SuppressWarnings("unchecked") public Map> substitutionsBySource() { Set subs = substitutions(); return subs.isEmpty() ? Collections.EMPTY_MAP : Collections.unmodifiableMap( new FilteredMap>(new SourceView(), new VisitedFilter())); } /** * Gets a map view of the substitutions for the specified edge. * @param edge The edge to get substitutions for. * @return The subset of {@link #substitutionsBySource()} in which the keys are aligned to the specified edge's * source and the associated values' targets are aligned to the specified edge's target. Since this map is * based on the one returned by {@link #substitutionsBySource()}, it is also read-only, and the same stipulations * apply to it. * * @see #substitutionsBySource() */ public Map> substitutionsBySourceFor(LFEdge edge) { Map> subsBySource = substitutionsBySource(); return subsBySource.isEmpty() ? subsBySource : new SubstitutedSourceView(subsBySource, edge); } class SourceView extends AbstractMap { @Override public Set> entrySet() { return new AbstractSet>() { Set subs = substitutions(); @Override public int size() { return subs.size(); } @Override public Iterator> iterator() { return new Iterator>() { private Iterator edgeIterator = null; @Override public boolean hasNext() { if(edgeIterator == null) { edgeIterator = subs.iterator(); } return edgeIterator.hasNext(); } @Override public Entry next() { if(edgeIterator == null) { edgeIterator = subs.iterator(); } LFVertex src = edgeIterator.next().getSource(); return new SimpleImmutableEntry(src, new FilteredLFEdgeSet(subs, new VertexMatchFilter(src, SOURCE_MATCH))); } @Override public void remove() { // subs.iterator() should be read-only, but just in case throw new UnsupportedOperationException(); } }; } }; } } class SubstitutedSourceView extends AbstractMap> { Map> sourceView; LFEdge edge; private Set>> entrySet; SubstitutedSourceView(Map> sourceView, LFEdge edge) { this.sourceView = sourceView; this.edge = edge; } @Override public Set>> entrySet() { return (entrySet == null) ? 
(entrySet = new EntrySet()) : entrySet; } class EntrySet extends AbstractSet>> { private Set>> entries; Set srcMapsTo = alignment.getTargets(edge.getSource().getIndex()), trgMapsTo = alignment.getTargets(edge.getTarget().getIndex()); Set>> entries() { if(entries == null) { entries = new FilteredSet>>( sourceView.entrySet(), new Filter>>() { @Override public boolean allows(Entry> e) { if(srcMapsTo.contains(e.getKey().getIndex())) { for(LFEdge t : e.getValue()) { if(trgMapsTo.contains(t.getTarget().getIndex())) { return true; } } } return false; } } ); } return entries; } @Override public int size() { return entries().size(); } @Override public Iterator>> iterator() { return new Iterator>>() { private Iterator>> i = entries().iterator(); @Override public boolean hasNext() { return i.hasNext(); } @Override public Entry> next() { Entry> e = i.next(); return new SimpleImmutableEntry>( e.getKey(), new FilteredLFEdgeSet(e.getValue(), new Filter() { @Override public boolean allows(LFEdge e) { return trgMapsTo.contains(e.getTarget().getIndex()); } } ) ); } @Override public void remove() { // source view is already read-only, so just in case throw new UnsupportedOperationException(); } }; } } } } ================================================ FILE: src/opennlp/ccg/disjunctivizer/LabelMatchFilter.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.disjunctivizer; import opennlp.ccg.hylo.graph.LFEdge; import opennlp.ccg.hylo.graph.LFEdgeLabel; import opennlp.ccg.util.Filter; /** * A filter for edges based on a comparison of their {@linkplain LFEdge#getLabel() labels}. Instances of * this class compare a specified {@linkplain #getBasis() basis edge label}, so that the * {@link #allows(LFEdge)} method returns true if it is * {@linkplain LFEdgeLabel#equals(Object) equivalent to} the specified edge's label. * * @author Scott Martin */ public class LabelMatchFilter implements Filter { LFEdgeLabel basis; /** * Creates a new label match filter that will compare edge labels to the specified label. * @param basis The label to be used for comparison. * @throws IllegalArgumentException if basis is null. */ public LabelMatchFilter(LFEdgeLabel basis) { checkBasis(basis); this.basis = basis; } private void checkBasis(LFEdgeLabel basis) { if(basis == null) { throw new IllegalArgumentException("basis is null"); } } /** * Gets the label used as the basis for comparison in the {@link #allows(LFEdge)} method. * @return The edge label specified at creation. 
* * @see #LabelMatchFilter(LFEdgeLabel) */ public LFEdgeLabel getBasis() { return basis; } /** * Sets the edge label used as the basis for comparison. * @throws IllegalArgumentException if basis is null. */ public void setBasis(LFEdgeLabel basis) { checkBasis(basis); this.basis = basis; } /** * Tests whether the specified edge's label is equivalent to this filter's {@linkplain #getBasis() basis * edge}. * @param edge The edge to test. * @return true if the basis edge label is equivalent to edge.getLabel() based on a * comparison via their {@link LFEdgeLabel#equals(Object)} method. */ @Override public boolean allows(LFEdge edge) { return basis.equals(edge.getLabel()); } } ================================================ FILE: src/opennlp/ccg/disjunctivizer/MatchType.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.disjunctivizer; import opennlp.ccg.hylo.graph.LFEdge; import opennlp.ccg.hylo.graph.LFVertex; /** * A set of enum constants for identifying the matching criteria used by a {@link MatchTypeFilter}. * Not all match type filters will use all of the match type criteria contained in this enum. * * @see LFVertex * @see LFEdge * * @author Scott Martin */ public enum MatchType { /** * Matching source vertices. */ SOURCE_MATCH, /** * Matching target vertices. */ TARGET_MATCH, /** * Matching edge labels. */ LABEL_MATCH, /** * Matching predicates for source vertices. */ SOURCE_PREDICATE_MATCH, /** * Matching predicates for target vertices. */ TARGET_PREDICATE_MATCH, /** * Mismatching source vertices. */ SOURCE_MISMATCH, /** * Mismatching target vertices. */ TARGET_MISMATCH, /** * Mismatching edge labels. */ LABEL_MISMATCH, /** * Mismatching source vertex predicates. */ SOURCE_PREDICATE_MISMATCH, /** * Mismatching target vertex predicates. */ TARGET_PREDICATE_MISMATCH, /** * Source vertex is aligned. */ SOURCE_ALIGNED, /** * Source vertex is not aligned. */ SOURCE_UNALIGNED, /** * Target vertex is aligned. */ TARGET_ALIGNED, /** * Target vertex is unaligned. */ TARGET_UNALIGNED } ================================================ FILE: src/opennlp/ccg/disjunctivizer/MatchTypeFilter.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. 
// // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.disjunctivizer; import java.util.Arrays; import java.util.Collection; import java.util.EnumSet; import opennlp.ccg.hylo.graph.LFEdge; import opennlp.ccg.util.Filter; /** * Abstract class for filters that allow {@link LFEdge}s based on criteria indicated by the set of * {@linkplain #getMatchTypes() match types} they use. * * @author Scott Martin * */ public abstract class MatchTypeFilter implements Filter { /** * The set of match types used as criteria by this filter. */ protected final EnumSet matchTypes; /** * Creates a new match type filter based on the specified match types. * @see #MatchTypeFilter(Collection) */ protected MatchTypeFilter(MatchType... matchTypes) { this(Arrays.asList(matchTypes)); } /** * Creates a new match type filter based on the specified match types. * @param matchTypes The collection of match types to use. The specified collection is * copied via {@link EnumSet#copyOf(Collection)}. */ protected MatchTypeFilter(Collection matchTypes) { this.matchTypes = EnumSet.copyOf(matchTypes); } /** * Gets the match types used by this match type filter. */ public EnumSet getMatchTypes() { return matchTypes; } } ================================================ FILE: src/opennlp/ccg/disjunctivizer/VertexMatchFilter.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.disjunctivizer; import static opennlp.ccg.disjunctivizer.MatchType.SOURCE_MATCH; import static opennlp.ccg.disjunctivizer.MatchType.SOURCE_MISMATCH; import static opennlp.ccg.disjunctivizer.MatchType.SOURCE_PREDICATE_MATCH; import static opennlp.ccg.disjunctivizer.MatchType.SOURCE_PREDICATE_MISMATCH; import static opennlp.ccg.disjunctivizer.MatchType.TARGET_MATCH; import static opennlp.ccg.disjunctivizer.MatchType.TARGET_MISMATCH; import static opennlp.ccg.disjunctivizer.MatchType.TARGET_PREDICATE_MATCH; import static opennlp.ccg.disjunctivizer.MatchType.TARGET_PREDICATE_MISMATCH; import java.util.Collection; import opennlp.ccg.hylo.graph.LFEdge; import opennlp.ccg.hylo.graph.LFVertex; /** * A filter that matches vertices based on a basis vertex and a set of match type criteria. *

* Instances of this class use the following match types: {@link MatchType#SOURCE_MATCH}, * {@link MatchType#SOURCE_MISMATCH}, {@link MatchType#TARGET_MATCH}, {@link MatchType#TARGET_MISMATCH}, * {@link MatchType#SOURCE_PREDICATE_MATCH}, {@link MatchType#SOURCE_PREDICATE_MISMATCH}, * {@link MatchType#TARGET_PREDICATE_MATCH}, {@link MatchType#TARGET_PREDICATE_MISMATCH}. * * @author Scott Martin */ public class VertexMatchFilter extends MatchTypeFilter { LFVertex basis; /** * Creates a new vertex match filter using the specified vertex as a basis for comparison and the * specified match type criteria. * @throws IllegalArgumentException if basis is null. * @see #VertexMatchFilter(LFVertex, Collection) */ public VertexMatchFilter(LFVertex basis, MatchType... matchTypes) { super(matchTypes); checkBasis(basis); this.basis = basis; } /** * Creates a new vertex match filter using the specified vertex as a basis for comparison and the * specified match type criteria. * @param basis The vertex to use as a basis for comparison. * @param matchTypes The set of match type criteria to use. * @throws IllegalArgumentException if basis is null. */ public VertexMatchFilter(LFVertex basis, Collection matchTypes) { super(matchTypes); checkBasis(basis); this.basis = basis; } private void checkBasis(LFVertex basis) { if(basis == null) { throw new IllegalArgumentException("basis is null"); } } /** * Gets the vertex that is the basis for comparison in this filter's {@link #allows(LFEdge)} method. */ public LFVertex getBasis() { return basis; } /** * Sets the vertex used as a basis for comparison. * @throws IllegalArgumentException if basis is null. */ public void setBasis(LFVertex basis) { checkBasis(basis); this.basis = basis; } /** * Tests whether a specified edge is allowed based on the match type criteria in effect and the * vertex used as a basis for comparison. * @param edge The edge to test. * @return false if {@link #getMatchTypes()} contains *

 *   • {@link MatchType#SOURCE_MATCH}, but the basis vertex does not equal the edge's source,
 *   • {@link MatchType#SOURCE_MISMATCH}, but the basis vertex is equal to the edge's source,
 *   • {@link MatchType#TARGET_MATCH}, but the basis vertex does not equal the edge's target,
 *   • {@link MatchType#TARGET_MISMATCH}, but the basis vertex is equal to the edge's target,
 *   • {@link MatchType#SOURCE_PREDICATE_MATCH}, but the basis vertex's predicate does not equal the edge's source vertex's predicate,
 *   • {@link MatchType#SOURCE_PREDICATE_MISMATCH}, but the basis vertex's predicate is equal to the edge's source vertex's predicate,
 *   • {@link MatchType#TARGET_PREDICATE_MATCH}, but the basis vertex's predicate does not equal the edge's target vertex's predicate,
 *   • {@link MatchType#TARGET_PREDICATE_MISMATCH}, but the basis vertex's predicate is equal to the edge's target vertex's predicate,
* and true otherwise. */ @Override public boolean allows(LFEdge edge) { for(MatchType t : matchTypes) { if(t == SOURCE_MATCH && !basis.equals(edge.getSource())) { return false; } else if(t == SOURCE_MISMATCH && basis.equals(edge.getSource())) { return false; } else if(t == TARGET_MATCH && !basis.equals(edge.getTarget())) { return false; } else if(t == TARGET_MISMATCH && basis.equals(edge.getTarget())) { return false; } else if(basis.getPredicate() != null) { if(t == SOURCE_PREDICATE_MATCH && !basis.getPredicate().equals(edge.getSource().getPredicate())) { return false; } else if(t == SOURCE_PREDICATE_MISMATCH && basis.getPredicate().equals(edge.getSource().getPredicate())) { return false; } else if(t == TARGET_PREDICATE_MATCH && !basis.getPredicate().equals(edge.getTarget().getPredicate())) { return false; } else if(t == TARGET_PREDICATE_MISMATCH && basis.getPredicate().equals(edge.getTarget().getPredicate())) { return false; } } } return true; } } ================================================ FILE: src/opennlp/ccg/disjunctivizer/package.html ================================================

Package for the disjunctivizer, which creates a disjunctive LF XML structure based on an {@link opennlp.ccg.disjunctivizer.LFGraphDifference}. An LF graph difference characterizes the difference between two {@link opennlp.ccg.hylo.graph.LFGraph graphs}, relative to an {@link opennlp.ccg.alignment.Alignment} between them, in terms of the edits needed to turn one into the other: inserts, deletes, and substitutions.
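As a rough, hypothetical usage sketch (not part of the package sources: the graphA, graphB, and alignment values, and the GraphDifferenceSketch wrapper, are invented names assumed to be supplied elsewhere), the edit sets exposed by LFGraphDifference might be inspected like this:

import java.util.Set;

import opennlp.ccg.alignment.Alignment;
import opennlp.ccg.disjunctivizer.LFGraphDifference;
import opennlp.ccg.hylo.graph.LFEdge;
import opennlp.ccg.hylo.graph.LFGraph;

// Illustrative helper, not part of OpenCCG: summarizes the edits between two LF graphs.
class GraphDifferenceSketch {
    static void summarize(LFGraph graphA, LFGraph graphB, Alignment alignment) {
        // graphA is treated as the A-position graph, graphB as the B-position graph.
        LFGraphDifference diff = new LFGraphDifference(graphA, graphB, alignment);
        // deletes(): A-graph edges with an aligned source but unaligned target
        Set<LFEdge> deletes = diff.deletes();
        // inserts(): B-graph edges with an aligned source but unaligned target
        Set<LFEdge> inserts = diff.inserts();
        // substitutions(): B-graph edges standing in for aligned A-graph edges
        Set<LFEdge> substitutions = diff.substitutions();
        System.out.println("deletes=" + deletes.size() + ", inserts=" + inserts.size()
                + ", substitutions=" + substitutions.size());
    }
}

The returned sets are read-only, so the sketch only iterates and counts them; attempting to modify them would throw UnsupportedOperationException, as documented above.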

The {@link opennlp.ccg.disjunctivizer.FilteredLFEdgeSet} class extends {@link opennlp.ccg.util.FilteredSet} to also provide views of its edges by {@linkplain opennlp.ccg.hylo.graph.LFEdge#getSource() source}, {@linkplain opennlp.ccg.hylo.graph.LFEdge#getTarget() target}, or {@linkplain opennlp.ccg.hylo.graph.LFEdge#getLabel() label}. The various filters in this package offer considerable flexibility in selecting edges: by whether their source, target, or label matches a given edge's (or just their predicates), and by whether their source or target is aligned. These filters, and the {@link opennlp.ccg.disjunctivizer.FilteredLFEdgeSet} class, are used internally by the {@link opennlp.ccg.disjunctivizer.Disjunctivizer} for generating disjunctive LFs.
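For illustration only (the edges set, vertex, and EdgeViewSketch names below are invented), a filtered, read-only view can be built the same way LFGraphDifference.deletesFor(LFVertex) does internally, by combining a VertexMatchFilter with a FilteredLFEdgeSet:

import java.util.Collection;
import java.util.Set;

import opennlp.ccg.disjunctivizer.FilteredLFEdgeSet;
import opennlp.ccg.disjunctivizer.MatchType;
import opennlp.ccg.disjunctivizer.VertexMatchFilter;
import opennlp.ccg.hylo.graph.LFEdge;
import opennlp.ccg.hylo.graph.LFEdgeLabel;
import opennlp.ccg.hylo.graph.LFVertex;

// Illustrative helper, not part of OpenCCG: lists the labels on edges leaving one vertex.
class EdgeViewSketch {
    static void showOutgoingLabels(Set<LFEdge> edges, LFVertex vertex) {
        // Keep only edges whose source vertex equals the given vertex.
        FilteredLFEdgeSet outgoing =
                new FilteredLFEdgeSet(edges, new VertexMatchFilter(vertex, MatchType.SOURCE_MATCH));
        // labelView() and targetView() are read-only views and may contain duplicates.
        Collection<LFEdgeLabel> labels = outgoing.labelView();
        Collection<LFVertex> targets = outgoing.targetView();
        System.out.println(labels.size() + " outgoing edges, labels: " + labels
                + ", targets: " + targets);
    }
}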

================================================ FILE: src/opennlp/ccg/grammar/AbstractApplicationRule.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.grammar; import opennlp.ccg.unify.*; import opennlp.ccg.synsem.*; import java.util.*; import org.jdom.Element; /** * Super class for application rules. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.8 $, $Date: 2009/12/21 03:27:18 $ */ public abstract class AbstractApplicationRule extends AbstractRule { private static final long serialVersionUID = 1L; protected Slash _functorSlash; /** Returns an XML element representing the rule. */ public Element toXml(String dir) { Element retval = new Element("application"); retval.setAttribute("dir", dir); return retval; } public int arity() { return 2; } protected List apply(Category xyCat, Category yCat) throws UnifyFailure { if (xyCat instanceof ComplexCat) { ComplexCat xyCurCat = (ComplexCat)xyCat; Arg xyOuter = xyCurCat.getOuterArg(); List results; _headCats.clear(); if (xyOuter instanceof BasicArg) { xyOuter.unifySlash(_functorSlash); Category xyOuterCat = ((BasicArg)xyOuter).getCat(); Substitution sub = new GSubstitution(); GUnifier.unify(xyOuterCat, yCat, sub); results = new ArrayList(1); ((GSubstitution)sub).condense(); Category result = (Category) xyCurCat.getResult().fill(sub); appendLFs(xyCat, yCat, result, sub); results.add(result); Slash xyOuterSlash = ((BasicArg)xyOuter).getSlash(); _headCats.add(xyOuterSlash.isModifier() ? yCat : xyCat); } else if (xyOuter instanceof SetArg) { SetArg xyOuterSet = (SetArg)xyOuter; results = new ArrayList(xyOuterSet.size()); for (int i=0; i apply(Category xyCat, Category yzCat) throws UnifyFailure { if (xyCat instanceof ComplexCat && yzCat instanceof ComplexCat) { List results = new ArrayList(1); _headCats.clear(); ComplexCat xyCC = (ComplexCat) xyCat; ComplexCat yzCC = (ComplexCat) yzCat; Arg xyOuter = xyCC.getOuterArg(); if (xyOuter instanceof BasicArg) { Slash xySlash = ((BasicArg) xyOuter).getSlash(); xySlash.unifyCheck(_functorSlash); if (eisner() && xySlash.isHarmonicCompositionResult()) throw new UnifyFailure(); Category xyOuterCat = ((BasicArg) xyOuter).getCat(); if (xyOuterCat instanceof AtomCat) { // e.g. 
s/s Y/Z ArgStack zStack = yzCC.getArgStack(); zStack.slashesUnify(_argSlash); Substitution sub = new GSubstitution(); GUnifier.unify(xyOuterCat, yzCC.getTarget(), sub); xySlash = (Slash) xySlash.fill(sub); xySlash.unifyCheck(_functorSlash); Category outcome = createResult(xyCC.getResult(), zStack, xySlash, sub); appendLFs(xyCat, yzCat, outcome, sub); results.add(outcome); _headCats.add(xySlash.isModifier() ? yzCat : xyCat); } else if (xyOuterCat instanceof ComplexCat) { // e.g. s/(s/n) Y/Z Substitution sub = new GSubstitution(); ArgStack zStack = composeComplexY((ComplexCat) xyOuterCat, xySlash, yzCC, sub); xySlash = (Slash) xySlash.fill(sub); xySlash.unifyCheck(_functorSlash); Category outcome = createResult(xyCC.getResult(), zStack, xySlash, sub); appendLFs(xyCat, yzCat, outcome, sub); results.add(outcome); _headCats.add(xySlash.isModifier() ? yzCat : xyCat); } } else if (xyOuter instanceof SetArg) { // e.g. s/{s,n} Y/Z Category yzTarget = yzCC.getTarget(); SetArg xyOuterSet = (SetArg) xyOuter; int targetIndex = xyOuterSet.indexOf(yzTarget); if (targetIndex > -1) { Slash xySlash = xyOuterSet.get(targetIndex).getSlash(); xySlash.unifyCheck(_functorSlash); if (eisner() && xySlash.isHarmonicCompositionResult()) throw new UnifyFailure(); Substitution sub = new GSubstitution(); GUnifier.unify(xyOuterSet.getCat(targetIndex), yzTarget, sub); Category result = xyCC.copy(); ((ComplexCat) result).setOuterArgument(xyOuterSet.copyWithout(targetIndex)); ArgStack zStack = yzCC.getArgStack(); zStack.slashesUnify(_argSlash); Category outcome = createResult(result, zStack, xySlash, sub); appendLFs(xyCat, yzCat, outcome, sub); results.add(outcome); _headCats.add(xySlash.isModifier() ? yzCat : xyCat); } else { boolean success = false; for (int i = 0; i < xyOuterSet.size(); i++) { BasicArg yInSet = xyOuterSet.get(i); if (yInSet.getCat() instanceof ComplexCat) { Slash xySlash = yInSet.getSlash(); xySlash.unifyCheck(_functorSlash); if (eisner() && xySlash.isHarmonicCompositionResult()) throw new UnifyFailure(); ComplexCat yCat = (ComplexCat) yInSet.getCat(); Substitution sub = new GSubstitution(); ArgStack zStack = composeComplexY((ComplexCat) yCat, xySlash, yzCC, sub); xySlash = (Slash) xySlash.fill(sub); xySlash.unifyCheck(_functorSlash); Category result = xyCC.copy(); ((ComplexCat) result).setOuterArgument(xyOuterSet.copyWithout(i)); Category outcome = createResult(result, zStack, xySlash, sub); appendLFs(xyCat, yzCat, outcome, sub); results.add(outcome); _headCats.add(xySlash.isModifier() ? yzCat : xyCat); success = true; } } if (!success) { throw new UnifyFailure(); } } } else { throw new UnifyFailure(); } return results; } else { throw new UnifyFailure(); } } private Category createResult(Category result, ArgStack zStack, Slash xySlash, Substitution sub) throws UnifyFailure { ((GSubstitution) sub).condense(); result = (Category) result.fill(sub); ArgStack newStack = zStack.fill(sub); if (!_isHarmonic && (!xySlash.sameDirAsModality() || zStack .containsContrarySlash())) { newStack.deepMap(INERTIZER_FCN); } newStack.get(0).setSlashModifier(false); if (_isHarmonic && useEisnerConstraints) newStack.setSlashHarmonicCompositionResult(true); if (result instanceof ComplexCat) { ((ComplexCat) result).add(newStack); } else { result = new ComplexCat((TargetCat) result, newStack); } return result; } /** * A function that tries to unify the value ant=+ into feature structures. 
*/ private static ModFcn INERTIZER_FCN = new ModFcn() { public void modify(Mutable m) { if (m instanceof Slash) { ((Slash) m).setAbility("inert"); } } }; private ArgStack composeComplexY(ComplexCat xyOuterCC, Slash xySlash, ComplexCat yzCC, Substitution sub) throws UnifyFailure { GUnifier.unify(xyOuterCC.getTarget(), yzCC.getTarget(), sub); ArgStack zStack = yzCC.getArgStack(); if (xyOuterCC.containsDollarArg()) { // e.g. s$/(s$\n) s\n/n xyOuterCC.getArgStack().unifyPrefix(zStack, zStack.size() - 1, sub); zStack = zStack.subList(zStack.size() - 1); zStack.slashesUnify(_argSlash); xySlash = (Slash) xySlash.fill(sub); xySlash.unifyCheck(_functorSlash); return zStack; } else if (xyOuterCC.arity() == 1) { ArgStack yzStack = yzCC.getArgStack(); if (!(xyOuterCC.getArg(0) instanceof BasicArg)) { throw new UnifyFailure(); } BasicArg xyOuterOuter = (BasicArg) xyOuterCC.getArg(0); Arg yzStackInner = yzStack.get(0); if (yzStackInner instanceof SetArg) { // e.g. s/(s/n) s/{s,n} SetArg yzSetArg = (SetArg) yzStackInner; int iaIndex = yzSetArg.indexOf(xyOuterOuter); if (iaIndex == -1) throw new UnifyFailure(); xyOuterOuter.unify(yzSetArg.get(iaIndex), sub); xySlash = (Slash) xySlash.fill(sub); xySlash.unifyCheck(_functorSlash); zStack = yzStack.copy(); zStack.set(0, yzSetArg.copyWithout(iaIndex)); zStack.slashesUnify(_argSlash); return zStack; } else { // e.g. s/(s/n) s/n/s if (yzStack.size() < 2) { throw new UnifyFailure(); } xyOuterOuter.unify(yzStackInner, sub); zStack = yzStack.subList(1).copy(); zStack.slashesUnify(_argSlash); xySlash = (Slash) xySlash.fill(sub); xySlash.unifyCheck(_functorSlash); return zStack; } } else if (xyOuterCC.arity() == 2) { // e.g. s\np/(s\np) s\np/(s\np)/n // nb: not dealing with set args ArgStack yzStack = yzCC.getArgStack(); if (!(xyOuterCC.getArg(0) instanceof BasicArg) || !(xyOuterCC.getArg(1) instanceof BasicArg) || yzStack.size() < 3) { throw new UnifyFailure(); } BasicArg xyOuterOuter1 = (BasicArg) xyOuterCC.getArg(0); BasicArg xyOuterOuter2 = (BasicArg) xyOuterCC.getArg(1); Arg yzStackInner1 = yzStack.get(0); Arg yzStackInner2 = yzStack.get(1); xyOuterOuter1.unify(yzStackInner1, sub); xyOuterOuter2.unify(yzStackInner2, sub); zStack = yzStack.subList(2).copy(); zStack.slashesUnify(_argSlash); xySlash = (Slash) xySlash.fill(sub); xySlash.unifyCheck(_functorSlash); return zStack; } else { // nb: not dealing with xyOuterCC arity > 2 throw new UnifyFailure(); } } } ================================================ FILE: src/opennlp/ccg/grammar/AbstractRule.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.grammar; import opennlp.ccg.unify.*; import opennlp.ccg.synsem.*; import opennlp.ccg.hylo.*; import java.io.Serializable; import java.util.*; import org.jdom.Element; /** * Implements some default behavior for Rule objects. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.18 $, $Date: 2009/12/21 03:27:18 $ */ public abstract class AbstractRule implements Rule, Serializable { private static final long serialVersionUID = 1L; /** The interned name of this rule. */ protected String _name; /** The rule group which contains this rule. */ protected RuleGroup _ruleGroup; /** Reusable list of head cats, one for each result. */ protected List _headCats = new ArrayList(); /** Returns an XML element representing the rule. */ abstract public Element toXml(); /** Applies the rule to the given input signs, adding to the given list of results. */ public void applyRule(Sign[] inputs, List results) { if (inputs.length != arity()) { // shouldn't happen throw new RuntimeException("Inputs must have length " + arity()); } Category[] cats = new Category[inputs.length]; for (int i=0; i < cats.length; i++) { cats[i] = inputs[i].getCategory(); } try { List resultCats = applyRule(cats); if (resultCats.isEmpty()) return; for (int i=0; i < resultCats.size(); i++) { Category catResult = resultCats.get(i); distributeTargetFeatures(catResult); Category headCat = _headCats.get(i); Sign lexHead = inputs[0].getLexHead(); for (int j=0; j < inputs.length; j++) { if (inputs[j].getCategory() == headCat) lexHead = inputs[j].getLexHead(); } Sign sign = Sign.createDerivedSign(catResult, inputs, this, lexHead); results.add(sign); } } catch (UnifyFailure uf) {} } /** Propagates distributive features from target cat to the rest. */ // nb: it would be nicer to combine inheritsFrom with $, but // this would be complicated, as inheritsFrom is compiled out protected void distributeTargetFeatures(Category cat) { if (_ruleGroup == null) return; if (_ruleGroup.grammar.lexicon.getDistributiveAttrs() == null) return; if (!(cat instanceof ComplexCat)) return; ComplexCat complexCat = (ComplexCat) cat; Category targetCat = (Category) complexCat.getTarget(); targetFS = (GFeatStruc) targetCat.getFeatureStructure(); if (targetFS == null) return; cat.forall(distributeTargetFeaturesFcn); } // target cat's feature structure private GFeatStruc targetFS = null; // copies ground distributive features from _targetFS to the rest private CategoryFcn distributeTargetFeaturesFcn = new DistributeTargetFeaturesFcn(); private class DistributeTargetFeaturesFcn extends CategoryFcnAdapter implements Serializable { private static final long serialVersionUID = 5247861522003485434L; public void forall(Category c) { if (!(c instanceof AtomCat)) return; FeatureStructure fs = c.getFeatureStructure(); if (fs == null) return; if (fs == targetFS) return; String[] distrAttrs = _ruleGroup.grammar.lexicon.getDistributiveAttrs(); for (int i = 0; i < distrAttrs.length; i++) { Object targetVal = targetFS.getValue(distrAttrs[i]); if (targetVal != null && !(targetVal instanceof Variable)) { fs.setFeature(distrAttrs[i], UnifyControl.copy(targetVal)); } } } } /** * The number of arguments this rule takes. For example, the arity of the * forward application rule of categorial grammar (X/Y Y => Y) is 2. * * @return the number of arguments this rule takes **/ public abstract int arity(); /** * Apply this rule to some input categories. 
* * @param inputs the input categories to try to combine * @return the categories resulting from using this rule to combine the * inputs * @exception UnifyFailure if the inputs cannot be combined by this rule **/ public abstract List applyRule(Category[] inputs) throws UnifyFailure; /** Prints an apply instance for the given categories to System.out. */ protected void showApplyInstance(Category[] inputs) { StringBuffer sb = new StringBuffer(); sb.append(_name).append(": "); for (int i=0; i < inputs.length; i++) { sb.append(inputs[i]).append(' '); } System.out.println(sb); } /** Prints an apply instance for the given categories to System.out. */ protected void showApplyInstance(Category first, Category second) { Category[] ca = {first,second}; showApplyInstance(ca); } /** * Returns the interned name of this rule. */ public String name() { return _name; } /** * Returns the rule group which contains this rule. */ public RuleGroup getRuleGroup() { return _ruleGroup; } /** * Sets this rule's rule group. */ public void setRuleGroup(RuleGroup ruleGroup) { _ruleGroup = ruleGroup; } /** Appends, fills, sorts and checks the LFs from cats 1 and 2 into the result cat. */ protected void appendLFs(Category cat1, Category cat2, Category result, Substitution sub) throws UnifyFailure { LF lf = HyloHelper.append(cat1.getLF(), cat2.getLF()); if (lf != null) { lf = (LF) lf.fill(sub); HyloHelper.sort(lf); HyloHelper.check(lf); } result.setLF(lf); } } ================================================ FILE: src/opennlp/ccg/grammar/AbstractSubstitutionRule.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-3 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.grammar; import opennlp.ccg.unify.*; import opennlp.ccg.synsem.*; import java.util.*; import org.jdom.Element; /** * Super class for substitution rules. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.5 $, $Date: 2009/12/21 03:27:18 $ */ public abstract class AbstractSubstitutionRule extends AbstractApplicationRule { private static final long serialVersionUID = 1L; protected boolean _isHarmonic; protected Slash _argSlash; /** Returns an XML element representing the rule. 
*/ public Element toXml(String dir) { Element retval = new Element("substitution"); retval.setAttribute("dir", dir); retval.setAttribute("harmonic", Boolean.toString(_isHarmonic)); return retval; } protected List apply (Category xyzCat, Category yzCat) throws UnifyFailure { if (xyzCat instanceof ComplexCat && yzCat instanceof ComplexCat) { ComplexCat xyzCC = (ComplexCat)xyzCat; ComplexCat yzCC = (ComplexCat)yzCat; if (xyzCC.arity() < 2 || xyzCC.containsDollarArg() || xyzCC.containsSetArg() || yzCC.containsSetArg() || yzCC.containsDollarArg()) { throw new UnifyFailure(); } ArgStack primaryStack = xyzCC.getArgStack(); int size = primaryStack.size(); BasicArg primaryArgY = (BasicArg)primaryStack.get(size-2); primaryArgY.unifySlash(_functorSlash); BasicArg primaryArgZ = (BasicArg)primaryStack.get(size-1); primaryArgZ.unifySlash(_argSlash); BasicArg secondaryArgZ = (BasicArg)yzCC.getOuterArg(); secondaryArgZ.unifySlash(_argSlash); Category secondaryY = yzCC.getResult(); GSubstitution sub = new GSubstitution(); GUnifier.unify(primaryArgZ.getCat(), secondaryArgZ.getCat(), sub); GUnifier.unify(primaryArgY.getCat(), secondaryY, sub); Category result = new ComplexCat(xyzCC.getTarget(), primaryStack.copyWithout(size-2)); ((GSubstitution)sub).condense(); result = (Category)result.fill(sub); ((ComplexCat)result).getOuterArg().setSlashModifier(false); appendLFs(xyzCat, yzCat, result, sub); List results = new ArrayList(1); _headCats.clear(); results.add(result); _headCats.add(primaryArgY.getSlash().isModifier() ? yzCat : xyzCat); return results; } else { throw new UnifyFailure(); } } } ================================================ FILE: src/opennlp/ccg/grammar/AbstractTypeRaisingRule.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.grammar; import opennlp.ccg.unify.*; import opennlp.ccg.synsem.*; import java.util.*; import org.jdom.Element; /** * Type-raising, e.g. np => s/(s\np). * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.9 $, $Date: 2009/12/21 03:27:18 $ */ // NB: It might make sense to eventually make this a subclass of TypeChangingRule, // but currently it's structured a bit differently. public abstract class AbstractTypeRaisingRule extends AbstractRule { private static final long serialVersionUID = 1L; /** The upper slash, eg the first slash in s/(s\np). */ protected Slash _upperSlash; /** The embedded slash, eg the second slash in s/(s\np). */ protected Slash _embeddedSlash; /** * The result of the type raised category, eg the "s" in s/(s\np). Defaults to "s". 
*/ protected Category _result; /** * The argument of the ComplexCat argument of the type raised category, * eg the "np" in s/(s\np). Defaults to "np". */ protected Category _arg; /** * Creates a new type raising rule with the given name; upper and lower slashes; * use dollar switch; arg category; and result category. Defaults are used * for the arg and result categories if null. */ protected AbstractTypeRaisingRule( String name, Slash uslash, Slash eslash, boolean useDollar, Category arg, Category result ) { _name = name; _upperSlash = uslash; _upperSlash.setAbility("active"); _upperSlash.setModifier(true); _embeddedSlash = eslash; _embeddedSlash.setAbility("active"); if (arg != null) { _arg = arg; } else { _arg = new AtomCat("np", new GFeatStruc()); } if (result != null) { _result = result; result.getFeatureStructure().setIndex(1); } else { GFeatStruc resfs = new GFeatStruc(); resfs.setIndex(1); _result = new AtomCat("s", resfs); } if (useDollar) { Dollar dol = new Dollar("1"); dol.setIndex(1); _result = new ComplexCat((AtomCat)_result, dol); } } /** Returns an XML element representing the rule. */ public Element toXml(String dir) { Element retval = new Element("typeraising"); retval.setAttribute("dir", dir); boolean usesDollar = (_result instanceof ComplexCat) && ((ComplexCat)_result).containsDollarArg(); retval.setAttribute("useDollar", Boolean.toString(usesDollar)); if (!(_arg instanceof AtomCat) || !((AtomCat)_arg).getType().equals("np")) { Element argElt = new Element("arg"); retval.addContent(argElt); argElt.addContent(_arg.toXml()); } if (!((AtomCat)_result.getTarget()).getType().equals("s")) { Element resultElt = new Element("result"); retval.addContent(resultElt); resultElt.addContent(_result.getTarget().toXml()); } return retval; } /** Returns 1. */ public int arity() { return 1; } /** Applies this rule to the given inputs. */ public List applyRule(Category[] inputs) throws UnifyFailure { if (inputs.length != 1) { throw new UnifyFailure(); } return apply(inputs[0]); } /** Applies this rule to the given input. 
*/ protected List apply(Category input) throws UnifyFailure { Substitution sub = new GSubstitution(); Category arg = (Category)_arg.unify(input, sub); ((GSubstitution)sub).condense(); Category result = _result.copy(); ComplexCat range; UnifyControl.reindex(result); if (result instanceof ComplexCat) { range = (ComplexCat)result.copy(); range.add(new BasicArg(_embeddedSlash, arg)); ((ComplexCat)result).add(new BasicArg(_upperSlash, range)); } else { range = new ComplexCat((TargetCat)result.copy(), new BasicArg(_embeddedSlash, arg)); result = new ComplexCat((TargetCat)result.copy(), new BasicArg(_upperSlash, range)); } // nb: with defined type changing rules, this step is done when the // rule is created; with type raising, it is done here, so that // the arg need not have its distributive features yet, and since // the full result category doesn't exist beforehand _ruleGroup.grammar.lexicon.propagateDistributiveAttrs(result); LF inputLF = input.getLF(); if (inputLF != null) { result.setLF((LF)inputLF.copy()); } List results = new ArrayList(1); _headCats.clear(); results.add(result); _headCats.add(input); return results; } } ================================================ FILE: src/opennlp/ccg/grammar/BackwardApplication.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002 Jason Baldridge // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.grammar; import opennlp.ccg.unify.*; import opennlp.ccg.synsem.*; import java.util.*; import org.jdom.Element; /** * Forward application: X/Y Y => X * * @author Jason Baldridge * @version $Revision: 1.3 $, $Date: 2009/07/17 04:23:30 $ */ public class BackwardApplication extends AbstractApplicationRule { private static final long serialVersionUID = 6981288425455531650L; public BackwardApplication () { _name = "<"; _functorSlash = new Slash('\\'); _functorSlash.setAbility("active"); } /** Returns an XML element representing the rule. 
 */
    public Element toXml() { return super.toXml("backward"); }

    public List<Category> applyRule(Category[] inputs) throws UnifyFailure {
        if (inputs.length != 2) {
            throw new UnifyFailure();
        }
        return apply(inputs[1], inputs[0]);
    }

    public String toString() {
        return "Y X\\Y => X";
    }
}


================================================
FILE: src/opennlp/ccg/grammar/BackwardComposition.java
================================================
///////////////////////////////////////////////////////////////////////////////
// Copyright (C) 2002 Jason Baldridge
//
// This library is free software; you can redistribute it and/or
// modify it under the terms of the GNU Lesser General Public
// License as published by the Free Software Foundation; either
// version 2.1 of the License, or (at your option) any later version.
//
// This library is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU Lesser General Public License for more details.
//
// You should have received a copy of the GNU Lesser General Public
// License along with this program; if not, write to the Free Software
// Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
//////////////////////////////////////////////////////////////////////////////

package opennlp.ccg.grammar;

import opennlp.ccg.unify.*;
import opennlp.ccg.synsem.*;
import java.util.*;
import org.jdom.Element;

/**
 * Backward composition, e.g. Y\Z X\Y => X\Z
 *
 * @author Jason Baldridge
 * @version $Revision: 1.3 $, $Date: 2009/07/17 04:23:30 $
 */
public class BackwardComposition extends AbstractCompositionRule {

    private static final long serialVersionUID = -937944882697380690L;

    public BackwardComposition() {
        this(true);
    }

    public BackwardComposition(boolean isHarmonic) {
        _isHarmonic = isHarmonic;
        if (isHarmonic) {
            _name = "<B";
            _functorSlash = new Slash('\\', "^");
            _argSlash = new Slash('\\', "^");
        } else {
            _name = "<Bx";
            _functorSlash = new Slash('\\', "x");
            _argSlash = new Slash('/', "x");
        }
        _functorSlash.setAbility("active");
    }

    /** Returns an XML element representing the rule. */
    public Element toXml() { return super.toXml("backward"); }

    public List<Category> applyRule(Category[] inputs) throws UnifyFailure {
        if (inputs.length != 2) {
            throw new UnifyFailure();
        }
        return apply(inputs[1], inputs[0]);
    }

    public String toString() {
        StringBuffer sb = new StringBuffer();
        sb.append("Y").append(_argSlash.toString()).append("Z ").append(
            "X\\Y => X").append(_argSlash.toString()).append("Z");
        return sb.toString();
    }
}


================================================
FILE: src/opennlp/ccg/grammar/BackwardSubstitution.java
================================================
///////////////////////////////////////////////////////////////////////////////
// Copyright (C) 2002 Jason Baldridge
//
// This library is free software; you can redistribute it and/or
// modify it under the terms of the GNU Lesser General Public
// License as published by the Free Software Foundation; either
// version 2.1 of the License, or (at your option) any later version.
//
// This library is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU Lesser General Public License for more details.
//
// You should have received a copy of the GNU Lesser General Public
// License along with this program; if not, write to the Free Software
// Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
//////////////////////////////////////////////////////////////////////////////

package opennlp.ccg.grammar;

import opennlp.ccg.unify.*;
import opennlp.ccg.synsem.*;
import java.util.*;
import org.jdom.Element;

/**
 * Backward substitution, e.g. Y\Z X\Y\Z => X\Z
 *
 * @author Jason Baldridge
 * @version $Revision: 1.3 $, $Date: 2009/07/17 04:23:30 $
 */
public class BackwardSubstitution extends AbstractSubstitutionRule {

    private static final long serialVersionUID = -4597839433754132265L;

    public BackwardSubstitution() {
        this(true);
    }

    public BackwardSubstitution(boolean isHarmonic) {
        _isHarmonic = isHarmonic;
        if (isHarmonic) {
            _name = "<S";
            _functorSlash = new Slash('\\', "^");
            _argSlash = new Slash('\\', "^");
        } else {
            _name = "<Sx";
            _functorSlash = new Slash('\\', "x");
            _argSlash = new Slash('/', "x");
        }
        _functorSlash.setAbility("active");
    }

    /** Returns an XML element representing the rule. */
    public Element toXml() { return super.toXml("backward"); }

    public List<Category> applyRule(Category[] inputs) throws UnifyFailure {
        if (inputs.length != 2) {
            throw new UnifyFailure();
        }
        return apply(inputs[1], inputs[0]);
    }

    public String toString() {
        StringBuffer sb = new StringBuffer();
        sb.append("Y").append(_argSlash.toString()).append("Z ").append(
            "X\\Y => X").append(_argSlash.toString()).append("Z");
        return sb.toString();
    }
}


================================================
FILE: src/opennlp/ccg/grammar/BackwardTypeRaising.java
================================================
///////////////////////////////////////////////////////////////////////////////
// Copyright (C) 2003 Jason Baldridge and University of Edinburgh (Michael White)
//
// This library is free software; you can redistribute it and/or
// modify it under the terms of the GNU Lesser General Public
// License as published by the Free Software Foundation; either
// version 2.1 of the License, or (at your option) any later version.
//
// This library is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU Lesser General Public License for more details.
//
// You should have received a copy of the GNU Lesser General Public
// License along with this program; if not, write to the Free Software
// Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
//////////////////////////////////////////////////////////////////////////////

package opennlp.ccg.grammar;

import org.jdom.Element;
import opennlp.ccg.synsem.*;

/**
 * Backward type-raising: X => Y\(Y/X).
 *
 * @author Jason Baldridge
 * @author Michael White
 * @version $Revision: 1.5 $, $Date: 2009/07/17 04:23:30 $
 */
public class BackwardTypeRaising extends AbstractTypeRaisingRule {

    private static final long serialVersionUID = 4334502669369098203L;

    /** Creates a backward type raising rule with the given parameters. */
    public BackwardTypeRaising(boolean useDollar, Category arg, Category result) {
        super("<T", new Slash('\\', new VarModality("i")),
              new Slash('/', new VarModality("i")), useDollar, arg, result);
    }

    /** Returns an XML element representing the rule. */
    public Element toXml() { return super.toXml("backward"); }

    public String toString() {
        return "X => Y\\(Y/X)";
    }
}


================================================
FILE: src/opennlp/ccg/grammar/ForwardApplication.java
================================================
///////////////////////////////////////////////////////////////////////////////
// Copyright (C) 2002 Jason Baldridge
//
// This library is free software; you can redistribute it and/or
// modify it under the terms of the GNU Lesser General Public
// License as published by the Free Software Foundation; either
// version 2.1 of the License, or (at your option) any later version.
//
// This library is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU Lesser General Public License for more details.
//
// You should have received a copy of the GNU Lesser General Public
// License along with this program; if not, write to the Free Software
// Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.grammar; import opennlp.ccg.unify.*; import opennlp.ccg.synsem.*; import java.util.*; import org.jdom.Element; /** * Forward application: X/Y Y => X * * @author Jason Baldridge * @version $Revision: 1.3 $, $Date: 2009/07/17 04:23:30 $ */ public class ForwardApplication extends AbstractApplicationRule { private static final long serialVersionUID = 1336124476870410093L; public ForwardApplication() { _name = ">"; _functorSlash = new Slash('/'); _functorSlash.setAbility("active"); } /** Returns an XML element representing the rule. */ public Element toXml() { return super.toXml("forward"); } public List applyRule(Category[] inputs) throws UnifyFailure { if (inputs.length != 2) { throw new UnifyFailure(); } return apply(inputs[0], inputs[1]); } public String toString() { return "X/Y Y => X"; } } ================================================ FILE: src/opennlp/ccg/grammar/ForwardComposition.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002 Jason Baldridge // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.grammar; import opennlp.ccg.unify.*; import opennlp.ccg.synsem.*; import java.util.*; import org.jdom.Element; /** * Forward composition, e.g. X/Y Y/Z => X/Z * * @author Jason Baldridge * @version $Revision: 1.3 $, $Date: 2009/07/17 04:23:30 $ */ public class ForwardComposition extends AbstractCompositionRule { private static final long serialVersionUID = -5029901211362928251L; public ForwardComposition() { this(true); } public ForwardComposition(boolean isHarmonic) { _isHarmonic = isHarmonic; if (isHarmonic) { _name = ">B"; _functorSlash = new Slash('/', "^"); _argSlash = new Slash('/', "^"); } else { _name = ">Bx"; _functorSlash = new Slash('/', "x"); _argSlash = new Slash('\\', "x"); } _functorSlash.setAbility("active"); } /** Returns an XML element representing the rule. 
*/ public Element toXml() { return super.toXml("forward"); } public List applyRule(Category[] inputs) throws UnifyFailure { if (inputs.length != 2) { throw new UnifyFailure(); } return apply(inputs[0], inputs[1]); } public String toString() { StringBuffer sb = new StringBuffer(); sb.append("X").append(_functorSlash.toString()).append("Y Y").append( _argSlash.toString()).append("Z => X").append( _argSlash.toString()).append("Z"); return sb.toString(); } } ================================================ FILE: src/opennlp/ccg/grammar/ForwardSubstitution.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002 Jason Baldridge // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.grammar; import opennlp.ccg.unify.*; import opennlp.ccg.synsem.*; import java.util.*; import org.jdom.Element; /** * Forward substitution, e.g. X/Y/Z Y/Z => X/Z * * @author Jason Baldridge * @version $Revision: 1.3 $, $Date: 2009/07/17 04:23:30 $ */ public class ForwardSubstitution extends AbstractSubstitutionRule { private static final long serialVersionUID = 7324585108055853456L; public ForwardSubstitution() { this(true); } public ForwardSubstitution(boolean isHarmonic) { _isHarmonic = isHarmonic; if (isHarmonic) { _name = ">S"; _functorSlash = new Slash('/', "^"); _argSlash = new Slash('/', "^"); } else { _name = ">Sx"; _functorSlash = new Slash('/', "x"); _argSlash = new Slash('\\', "x"); } _functorSlash.setAbility("active"); } /** Returns an XML element representing the rule. */ public Element toXml() { return super.toXml("forward"); } public List applyRule(Category[] inputs) throws UnifyFailure { if (inputs.length != 2) { throw new UnifyFailure(); } return apply(inputs[0], inputs[1]); } public String toString() { StringBuffer sb = new StringBuffer(); sb.append("X").append(_functorSlash.toString()).append("Y Y").append( _argSlash.toString()).append("Z => X").append( _argSlash.toString()).append("Z"); return sb.toString(); } } ================================================ FILE: src/opennlp/ccg/grammar/ForwardTypeRaising.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. 
// // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.grammar; import org.jdom.Element; import opennlp.ccg.synsem.*; /** * Forward type-raising: X => Y/(Y\X). * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.5 $, $Date: 2009/07/17 04:23:30 $ */ public class ForwardTypeRaising extends AbstractTypeRaisingRule { private static final long serialVersionUID = 1417585756957436141L; /** Creates a forward type raising rule with the given parameters. */ public ForwardTypeRaising (boolean useDollar, Category arg, Category result) { super(">T", new Slash('/', new VarModality("i")), new Slash('\\', new VarModality("i")), useDollar, arg, result); } /** Returns an XML element representing the rule. */ public Element toXml() { return super.toXml("forward"); } public String toString() { return "X => Y/(Y\\X)"; } } ================================================ FILE: src/opennlp/ccg/grammar/FragmentJoining.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2007 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.grammar; import opennlp.ccg.synsem.*; import opennlp.ccg.unify.*; import java.util.*; import org.jdom.Element; /** * Rule for joining fragments that don't fit together, when all else fails. * * @author Michael White * @version $Revision: 1.4 $, $Date: 2009/07/17 04:23:30 $ */ public class FragmentJoining extends AbstractRule { private static final long serialVersionUID = 7451163798607652012L; /** Constructor. */ public FragmentJoining() { _name = "*"; } /** Returns an XML element representing the rule (not supported). */ public Element toXml() { throw new RuntimeException("toXml not supported for FragmentJoining rules"); } /** * Returns the result of applying this rule to two input signs. */ public Sign applyRule(Sign sign1, Sign sign2) { List results = new ArrayList(1); Sign[] inputs = new Sign[] { sign1, sign2 }; applyRule(inputs, results); return results.get(0); } /** * Apply this rule to two input categories. * Returns a copy of the first cat with the LFs appended. 
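The classes above cover the standard CCG combinators: application, composition, substitution and type raising. As a quick orientation aid, here is a small hypothetical driver (not part of the library) that instantiates each rule and prints the interned name and schema exposed through name() and toString():

import opennlp.ccg.grammar.*;

// Hypothetical driver: list the combinatory rules defined above with their schemas.
public class RuleInventory {
    public static void main(String[] args) {
        Rule[] rules = {
            new ForwardApplication(),                   // >   : X/Y Y => X
            new BackwardApplication(),                  // <   : Y X\Y => X
            new ForwardComposition(true),               // >B  : harmonic composition
            new ForwardComposition(false),              // >Bx : crossed composition
            new BackwardComposition(true),              // <B
            new BackwardComposition(false),             // <Bx
            new ForwardSubstitution(true),              // >S
            new BackwardSubstitution(true),             // <S
            new ForwardTypeRaising(false, null, null),  // >T  : X => Y/(Y\X)
            new BackwardTypeRaising(false, null, null)  // <T  : X => Y\(Y/X)
        };
        for (Rule r : rules) System.out.println(r.name() + "\t" + r);
    }
}

Passing null for the type-raising arg and result categories falls back to the np and s defaults set up in AbstractTypeRaisingRule.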
**/ public List applyRule(Category[] inputs) throws UnifyFailure { if (inputs.length != 2) { throw new UnifyFailure(); } List results = new ArrayList(1); _headCats.clear(); Category result = inputs[0].shallowCopy(); try { appendLFs(inputs[0], inputs[1], result, new EmptySubstitution()); } catch (UnifyFailure uf) { // not expected // System.err.println("Unexpected unify failure in appending LFs when joining fragments:"); // System.err.println("cat0: " + inputs[0] + " lf: " + inputs[0].getLF()); // System.err.println("cat1: " + inputs[1] + " lf: " + inputs[1].getLF()); } results.add(result); _headCats.add(inputs[0]); return results; } /** * The number of arguments this rule takes. **/ public int arity() { return 2; } /** Returns a string for this rule. */ public String toString() { return "X Y *=> X"; } } ================================================ FILE: src/opennlp/ccg/grammar/GlueRule.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2011 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.grammar; import java.util.*; import org.jdom.Element; import opennlp.ccg.synsem.*; import opennlp.ccg.unify.*; /** * Implements a glue rule for combining a sequence of fragments. * The rule is frag|cat cat => frag, allowing only the first input * to itself be a fragment, unless the second input has the * frag completion flag set, meaning that it completes a chunk/alt. * * @author Michael White * @version $Revision: 1.3 $, $Date: 2011/06/07 05:12:01 $ */ public class GlueRule extends AbstractRule { private static final long serialVersionUID = 4867141181941895272L; // empty subst for combining LFs private static final Substitution emptySubst = new SimpleSubstitution(); /** Fragment result type. */ public static final String resultType = "frag"; /** Constructor. */ public GlueRule() { _name = "glue"; } /** Returns an XML element representing the rule (not supported). */ public Element toXml() { throw new RuntimeException("toXml not supported for GlueRule rules"); } /** Arity. */ public int arity() { return 2; } /** Glues cats into fragments. 
*/ public List applyRule(Category[] inputs) throws UnifyFailure { // check num inputs if (inputs.length != 2) { throw new UnifyFailure(); } // check for frag as second input with completion false if (inputs[1] instanceof AtomCat) { AtomCat ac2 = (AtomCat) inputs[1]; if (ac2.isFragment() && !ac2.fragCompletion) throw new UnifyFailure(); } // make result cat List results = new ArrayList(1); _headCats.clear(); AtomCat ac = new AtomCat(resultType); appendLFs(inputs[0], inputs[1], ac, emptySubst); results.add(ac); // guess head, with left as default boolean leftHead = true; boolean leftMod = isModifier(inputs[0]); boolean rightMod = isModifier(inputs[1]); if ((inputs[0] instanceof AtomCat && inputs[1] instanceof ComplexCat && !rightMod) || (leftMod && !rightMod)) { leftHead = false; } // return result cat with guessed head _headCats.add(leftHead ? inputs[0] : inputs[1]); return results; } // modifier check private static boolean isModifier(Category cat) { if (cat instanceof ComplexCat) { ComplexCat xyCat = (ComplexCat) cat; Arg arg = xyCat.getOuterArg(); if (arg instanceof BasicArg) { return ((BasicArg)arg).getSlash().isModifier(); } } return false; } /** toString. */ public String toString() { return "frag|cat cat => frag"; } } ================================================ FILE: src/opennlp/ccg/grammar/Grammar.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-5 University of Edinburgh (Michael White) and Gunes Erkan // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.grammar; import opennlp.ccg.lexicon.*; import opennlp.ccg.util.*; import opennlp.ccg.synsem.*; import opennlp.ccg.hylo.*; import opennlp.ccg.parse.Parser; import opennlp.ccg.parse.ParseException; import opennlp.ccg.realize.Realizer; import org.jdom.*; import org.jdom.input.*; import org.jdom.output.*; import org.jdom.transform.*; import org.xml.sax.*; import javax.xml.parsers.*; import javax.xml.transform.*; import javax.xml.transform.stream.*; import javax.xml.transform.sax.*; import java.io.*; import java.net.URL; import java.util.*; /** * A CCG grammar is essentially a lexicon plus a rule group. * A grammar may also have sequences of transformations to use in * loading/saving LFs from/to XML. * * @author Michael White * @author Gunes Erkan * @version $Revision: 1.45 $, $Date: 2010/12/06 02:39:35 $ */ public class Grammar { /** The lexicon. */ public final Lexicon lexicon; /** The rule group. */ public final RuleGroup rules; /** The type hierarchy. */ public final Types types; /** The features to include in supertags. */ public final Set supertagFeatures = new HashSet(); /** The sequence of transformations to use when loading LFs from XML. 
*/ public final URL[] fromXmlTransforms; /** The sequence of transformations to use when saving LFs to XML. */ public final URL[] toXmlTransforms; /** Preferences for displaying elements in this grammar. */ public DisplayPrefs prefs = new DisplayPrefs(); /** For access to the current grammar; should be generalized eventually. */ public static Grammar theGrammar; // name of the grammar private String grammarName = null; // parser, for getting parsed words private Parser parser = null; // XML factories private SAXParserFactory spf = null; private static SAXTransformerFactory stf = null; // transformer for loading/saving LFs from/to XML private Transformer transformer = null; // transformations for loading/saving LFs from/to XML private Templates[] fromXmlTemplates = null; private Templates[] toXmlTemplates = null; // transformer for saving strings to APML private Transformer apmlTransformer = null; /** The pitch accents recognized as underscored suffixes for translation to APML. */ public static final String[] pitchAccents = { "H*", "L*", "L+H*", "L*+H", "H*+L", "H+L*" }; // set of pitch accents private static Set pitchAccentsSet = null; /** The boundary tones recognized as separate tokens for translation to APML. */ public static final String[] boundaryTones = { "L", "H", "LL%", "HH%", "LH%", "HL%" }; // set of boundary tones private static Set boundaryTonesSet = null; /** Loads a grammar from the given filename. */ public Grammar(String filename) throws IOException { this(new File(filename).toURI().toURL()); } /** Loads a grammar from the given URL. */ public Grammar(URL url) throws IOException { this(url, false); } /** Loads a grammar from the given URL, with the given flag for whether to ignore rule combos. */ @SuppressWarnings("unchecked") public Grammar(URL url, boolean ignoreCombos) throws IOException { theGrammar = this; // read XML SAXBuilder builder = new SAXBuilder(); Document doc; try { doc = builder.build(url); } catch (JDOMException jde) { throw (IOException) new IOException().initCause(jde); } Element root = doc.getRootElement(); // root corresponds to grammarName = root.getAttributeValue("name"); Element supertagsElt = root.getChild("supertags"); if (supertagsElt != null) { String feats = supertagsElt.getAttributeValue("feats"); if (feats != null) { String[] names = feats.split("\\s+"); for (int i = 0; i < names.length; i++) { supertagFeatures.add(names[i]); } } } if (supertagFeatures.isEmpty()) { // default is "form" and "lex" supertagFeatures.add("form"); supertagFeatures.add("lex"); } Tokenizer tokenizer = null; Element tokenizerElt = root.getChild("tokenizer"); if (tokenizerElt != null) { String tokenizerClass = tokenizerElt.getAttributeValue("classname"); if (tokenizerClass != null) { try { tokenizer = (Tokenizer) Class.forName(tokenizerClass).newInstance(); } catch (Exception exc) { throw (IOException) new IOException().initCause(exc); } } else tokenizer = new DefaultTokenizer(); String replacementSemClasses = tokenizerElt.getAttributeValue("replacement-sem-classes"); if (replacementSemClasses != null) { String[] semClasses = replacementSemClasses.split("\\s+"); for (int i = 0; i < semClasses.length; i++) { tokenizer.addReplacementSemClass(semClasses[i]); } } } Element typesElt = root.getChild("types"); URL typesUrl; if (typesElt != null) { typesUrl = new URL(url, typesElt.getAttributeValue("file")); } else typesUrl = null; Element lexiconElt = root.getChild("lexicon"); boolean openlex = "true".equals(lexiconElt.getAttributeValue("openlex")); URL lexiconUrl = new 
URL(url, lexiconElt.getAttributeValue("file")); Element morphElt = root.getChild("morphology"); URL morphUrl = new URL(url, morphElt.getAttributeValue("file")); Element rulesElt = root.getChild("rules"); URL rulesUrl = new URL(url, rulesElt.getAttributeValue("file")); Element fromXmlElt = root.getChild("LF-from-XML"); if (fromXmlElt != null) { List children = fromXmlElt.getChildren(); fromXmlTransforms = new URL[children.size()]; for (int i = 0; i < children.size(); i++) { Element transformElt = (Element) children.get(i); fromXmlTransforms[i] = new URL(url, transformElt.getAttributeValue("file")); } } else { fromXmlTransforms = new URL[0]; } Element toXmlElt = root.getChild("LF-to-XML"); if (toXmlElt != null) { List children = toXmlElt.getChildren(); toXmlTransforms = new URL[children.size()]; for (int i = 0; i < children.size(); i++) { Element transformElt = (Element) children.get(i); toXmlTransforms[i] = new URL(url, transformElt.getAttributeValue("file")); } } else { toXmlTransforms = new URL[0]; } // load type hierarchy, lexicon and rules if (typesUrl != null) types = new Types(typesUrl, this); else types = new Types(this); if (tokenizer != null) lexicon = new Lexicon(this, tokenizer); else lexicon = new Lexicon(this); lexicon.openlex = openlex; lexicon.init(lexiconUrl, morphUrl); rules = new RuleGroup(rulesUrl, this); // add observed supertag-rule combos for filtering, if any, unless ignoring combos if (!ignoreCombos) { String combosfile = rulesElt.getAttributeValue("combosfile"); if (combosfile != null) { URL combosUrl = new URL(url, combosfile); rules.loadSupercatRuleCombos(combosUrl); } // set dynamic combos: defaults to true with a combosfile, otherwise defaults to false boolean dynamic = (combosfile != null); String dynamicCombos = rulesElt.getAttributeValue("dynamic-combos"); if (dynamicCombos != null) dynamic = Boolean.parseBoolean(dynamicCombos); rules.setDynamicCombos(dynamic); } } /** * Returns a file url string relative to the user's current directory * for the given filename. 
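The constructor above resolves every component file relative to the URL of the top-level grammar file. For reference, a hypothetical top-level file using the element and attribute names read here might look as follows; the root element name, the <transform> child name, and all file names are illustrative assumptions rather than something fixed by this code:

<grammar name="sample">
  <supertags feats="form lex"/>
  <lexicon file="lexicon.xml" openlex="false"/>
  <morphology file="morph.xml"/>
  <types file="types.xml"/>
  <rules file="rules.xml" combosfile="combos.txt" dynamic-combos="true"/>
  <LF-from-XML> <transform file="from-xml.xsl"/> </LF-from-XML>
  <LF-to-XML> <transform file="to-xml.xsl"/> </LF-to-XML>
</grammar>

Such a file would then be loaded with new Grammar("path/to/grammar.xml") or new Grammar(url).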
*/ public static String convertToFileUrl(String filename) { try { return new File(filename).toURI().toURL().toString(); } catch (java.net.MalformedURLException exc) { throw (RuntimeException) new RuntimeException().initCause(exc); } // return "file:"+System.getProperty("user.dir")+"/"+filename; } // initializes factories and transformers private void initializeTransformers() throws TransformerConfigurationException { // init factories if (spf == null) { spf = SAXParserFactory.newInstance(); spf.setNamespaceAware(true); } if (stf == null) { stf = (SAXTransformerFactory) TransformerFactory.newInstance(); try { // try setting indent at factory level stf.setAttribute("indent-number", new Integer(2)); } catch (IllegalArgumentException exc) {} // ignore } // set up transformer with indenting // nb: with some JVMs (eg JDK 1.4.1 on Windows), // the transformer needs to be reinitialized each time, in order to // run multiple :r FN commands in tccg if (transformer == null) { transformer = stf.newTransformer(); transformer.setOutputProperty(OutputKeys.INDENT, "yes"); try { // also try setting indent as a xalan property transformer.setOutputProperty("{http://xml.apache.org/xalan}indent-amount", "2"); } catch (IllegalArgumentException exc) {} // ignore } // set up apml transformer if (apmlTransformer == null) { InputStream toApmlStr = ClassLoader.getSystemResourceAsStream("opennlp/ccg/grammar/to-apml.xsl"); apmlTransformer = stf.newTransformer(new StreamSource(toApmlStr)); // nb: DOCTYPE SYSTEM also specified in to-apml.xsl; including // redundant specification here to workaround omission of DOCTYPE with Linux 1.5 JVM apmlTransformer.setOutputProperty(OutputKeys.DOCTYPE_SYSTEM, "apml.dtd"); } } // does setup for LF from XML transformation, and returns a SAXSource for the given input stream // nb: need a new filter chain one for each use (perhaps due to an underyling bug) private SAXSource fromXmlSetup(InputStream istream) throws IOException { try { // initialize transformer initializeTransformers(); // load transformations if (fromXmlTemplates == null) { fromXmlTemplates = new Templates[fromXmlTransforms.length]; for (int i = 0; i < fromXmlTemplates.length; i++) { String url = fromXmlTransforms[i].toString(); fromXmlTemplates[i] = stf.newTemplates(new StreamSource(url)); } } // set up initial reader SAXParser parser = spf.newSAXParser(); XMLReader reader = parser.getXMLReader(); // set up chain of filters XMLFilter[] filters = new XMLFilter[fromXmlTransforms.length]; for (int i = 0; i < filters.length; i++) { // create filter filters[i] = stf.newXMLFilter(fromXmlTemplates[i]); // set parent if (i == 0) { filters[0].setParent(reader); } else { filters[i].setParent(filters[i-1]); } } // set final reader/filter XMLReader finalReader = (filters.length == 0) ? reader : filters[filters.length-1]; // set up and return LF from XML SAX source with final reader/filter return new SAXSource(finalReader, new InputSource(istream)); } catch (ParserConfigurationException pce) { throw (IOException) new IOException().initCause(pce); } catch (SAXException se) { throw (IOException) new IOException().initCause(se); } catch (TransformerConfigurationException tce) { throw (IOException) new IOException().initCause(tce); } } /** * Loads a document from the XML in the given input stream, * applying the configured from-XML transformations. 
*/ public synchronized Document loadFromXml(InputStream istream) throws IOException { try { // do setup and get source Source source = fromXmlSetup(istream); // do transformation JDOMResult result = new JDOMResult(); transformer.transform(source, result); // return result doc return result.getDocument(); } catch (TransformerException exc) { throw (IOException) new IOException().initCause(exc); } } /** * Loads a document from the XML file with the given filename, * applying the configured from-XML transformations. */ public synchronized Document loadFromXml(String filename) throws IOException { BufferedInputStream bis = new BufferedInputStream(new FileInputStream(filename)); Document retval = loadFromXml(bis); bis.close(); return retval; } // does setup for LF to XML transformation, and returns a SAXSource for the given source // nb: need a new filter chain one for each use (perhaps due to an underyling bug) private SAXSource toXmlSetup(Source source) throws IOException { try { // initialize transformer initializeTransformers(); // load transformations if (toXmlTemplates == null) { toXmlTemplates = new Templates[toXmlTransforms.length]; for (int i = 0; i < toXmlTemplates.length; i++) { // File file = new File(toXmlTransforms[i]); // toXmlTemplates[i] = stf.newTemplates(new StreamSource(file)); String url = toXmlTransforms[i].toString(); toXmlTemplates[i] = stf.newTemplates(new StreamSource(url)); } } // set up initial reader SAXParser parser = spf.newSAXParser(); XMLReader reader = parser.getXMLReader(); // set up chain of filters XMLFilter[] filters = new XMLFilter[toXmlTransforms.length]; for (int i = 0; i < filters.length; i++) { // create filter filters[i] = stf.newXMLFilter(toXmlTemplates[i]); // set parent if (i == 0) { filters[0].setParent(reader); } else { filters[i].setParent(filters[i-1]); } } // set final reader/filter XMLReader finalReader = (filters.length == 0) ? reader : filters[filters.length-1]; // set up and return LF to XML SAX source with final reader/filter return new SAXSource(finalReader, SAXSource.sourceToInputSource(source)); } catch (ParserConfigurationException pce) { throw (IOException) new IOException().initCause(pce); } catch (SAXException se) { throw (IOException) new IOException().initCause(se); } catch (TransformerConfigurationException tce) { throw (IOException) new IOException().initCause(tce); } } /** * Saves the given LF with the given target string to an XML file * with the given filename, applying the configured to-XML * transformations. */ public synchronized void saveToXml(LF lf, String target, String filename) throws IOException { // ensure dirs exist for filename File file = new File(filename); File parent = file.getParentFile(); if (parent != null && !parent.exists()) { parent.mkdirs(); } FileOutputStream out = new FileOutputStream(file); saveToXml(lf, target, out); out.close(); } /** * Saves the given LF with the given target string as XML to the * given output stream, applying the configured to-XML * transformations. 
*/ public synchronized void saveToXml(LF lf, String target, OutputStream out) throws IOException { // make doc with XML for LF and target Document doc = new Document(); Element root = new Element("xml"); doc.setRootElement(root); root.addContent(HyloHelper.toXml(lf)); Element targetElt = new Element("target"); targetElt.addContent(target); root.addContent(targetElt); // write transformed doc to file try { // do setup and get source Source source = toXmlSetup(new JDOMSource(doc)); // do transformation transformer.transform(source, new StreamResult(new OutputStreamWriter(out))); } catch (TransformerException exc) { throw (IOException) new IOException().initCause(exc); } } /** * Transforms an LF by applying the configured to-XML and from-XML transformations, * then loading the LF from the resulting doc. */ public synchronized LF transformLF(LF lf) throws IOException { ByteArrayOutputStream out = new ByteArrayOutputStream(); saveToXml(lf, "", out); ByteArrayInputStream in = new ByteArrayInputStream(out.toByteArray()); Document doc = loadFromXml(in); return Realizer.getLfFromDoc(doc); } /** * Loads an LF by applying the configured from-XML transformations, * then loading the LF from the resulting doc. */ public synchronized LF loadLF(Document doc) throws IOException { ByteArrayOutputStream out = new ByteArrayOutputStream(); serializeXml(doc, out); ByteArrayInputStream in = new ByteArrayInputStream(out.toByteArray()); Document doc2 = loadFromXml(in); return Realizer.getLfFromDoc(doc2); } /** * Convenience method to serialize XML. */ public synchronized void serializeXml(Document doc, OutputStream out) throws IOException { try { initializeTransformers(); JDOMResult result = new JDOMResult(); // as suggested by Amy Isard, for better java/xml version compatibility transformer.transform(new JDOMSource(doc), result); XMLOutputter outputter = new XMLOutputter(); outputter.setFormat(Format.getPrettyFormat()); outputter.output(result.getDocument(), new OutputStreamWriter(out)); // end of A.I. suggestion } catch (TransformerException exc) { throw (IOException) new IOException().initCause(exc); } } /** * Makes an element for the given LF, applying the configured to-XML transformations. */ public synchronized Element makeLfElt(LF lf) throws IOException { // make doc with LF in it Document lfDoc = new Document(); lfDoc.setRootElement(HyloHelper.toXml(lf)); // apply to-XML transformations try { // do setup and get source Source source = toXmlSetup(new JDOMSource(lfDoc)); // do transformation and get resulting doc JDOMResult result = new JDOMResult(); transformer.transform(source, result); lfDoc = result.getDocument(); } catch (TransformerException exc) { throw (IOException) new IOException().initCause(exc); } return lfDoc.detachRootElement(); } /** * Returns whether the given string is a recognized pitch accent. */ public static boolean isPitchAccent(String s) { if (pitchAccentsSet == null) { pitchAccentsSet = new HashSet(); for (int i = 0; i < pitchAccents.length; i++) { pitchAccentsSet.add(pitchAccents[i]); } } return pitchAccentsSet.contains(s); } /** * Returns whether the given string is a recognized boundary tone. */ public static boolean isBoundaryTone(String s) { if (boundaryTonesSet == null) { boundaryTonesSet = new HashSet(); for (int i = 0; i < boundaryTones.length; i++) { boundaryTonesSet.add(boundaryTones[i]); } } return boundaryTonesSet.contains(s); } /** * Saves the given sign's words, pitch accents and boundary tones * to an APML file with the given filename. 
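The methods above form the LF/XML plumbing: loadFromXml applies the LF-from-XML transform chain, saveToXml applies the LF-to-XML chain, and transformLF/loadLF compose the two. A minimal, untested sketch of a round trip, with the file names and the target sentence invented for illustration:

import org.jdom.Document;
import opennlp.ccg.grammar.Grammar;
import opennlp.ccg.synsem.*;     // LF (wildcard imports, mirroring Grammar's own imports)
import opennlp.ccg.hylo.*;
import opennlp.ccg.realize.Realizer;

// Hypothetical sketch: round-trip an LF through the configured XML transforms.
public class LfRoundTrip {
    public static void main(String[] args) throws java.io.IOException {
        Grammar grammar = new Grammar("grammar.xml");               // assumed grammar file
        Document doc = grammar.loadFromXml("item.xml");             // applies LF-from-XML transforms
        LF lf = Realizer.getLfFromDoc(doc);                         // as done in transformLF()/loadLF() above
        grammar.saveToXml(lf, "the dog barks", "out/item-lf.xml");  // applies LF-to-XML transforms
    }
}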
*/ public synchronized void saveToApml(Sign sign, String filename) throws IOException { // ensure dirs exist for filename File file = new File(filename); File parent = file.getParentFile(); if (parent != null && !parent.exists()) { parent.mkdirs(); } // do transformation FileWriter fw = new FileWriter(file); saveToApml(sign, fw); fw.close(); } /** * Saves the given sign's words, pitch accents and boundary tones * as APML to the given writer. * The orthography is first converted to XML using Sign.getWordsInXml, * and then converted to APML using opennlp/ccg/grammar/to-apml.xsl. * The string is assumed to be a single performative. */ public synchronized void saveToApml(Sign sign, Writer writer) throws IOException { // convert words Document doc = sign.getWordsInXml(); // write transformed doc to file try { // do setup and get source initializeTransformers(); Source source = new JDOMSource(doc); // do transformation apmlTransformer.transform(source, new StreamResult(writer)); } catch (TransformerException exc) { throw (IOException) new IOException().initCause(exc); } } /** * Returns the words for the given string, as determined by its * first parse, or an empty list, if it cannot be parsed. */ // NB: Could try to extend this to find the parse with the intended LF. public List getParsedWords(String s) { // ensure parser instantiated if (parser == null) parser = new Parser(this); // get parses try { parser.parse(s); } catch (ParseException pe) { return new ArrayList(0); } List parses = parser.getResult(); // return words of first parse Sign sign = parses.get(0); return sign.getWords(); } /** * Returns the name of the loaded grammar. Null if no name given. */ public final String getName() { return grammarName; } /** * Writes the list of words to a basic morph file. * @throws IOException */ public void toMorphXml(List words, String filename) throws IOException { Collections.sort(words); XMLOutputter xout = new XMLOutputter(); xout.setFormat(Format.getPrettyFormat()); PrintWriter out = new PrintWriter(new BufferedWriter(new FileWriter(filename))); out.println(""); out.println(""); for (Word w : words) { Element e = new Element("entry"); e.setAttribute("word", w.getForm()); if (w.getForm() != w.getStem() && w.getStem() != null) e.setAttribute("stem", w.getStem()); if (w.getPOS() != null) e.setAttribute("pos", w.getPOS()); if (w.getSemClass() != null) e.setAttribute("class", w.getSemClass()); xout.output(e, out); out.println(); } out.println(""); out.flush(); out.close(); } /** * Writes the list of categories and associated POS tags to a basic lexicon file. * Note that the LFs are expected to have a [*DEFAULT*] proposition in the * desired location for predicate insertion. 
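toMorphXml above offers a quick way to bootstrap a morphology file from a word list. A hypothetical sketch that dumps the words of a single parsed sentence; the grammar path, sentence and output file are invented, and the words are copied into a fresh ArrayList because toMorphXml sorts the list in place:

import java.util.*;
import opennlp.ccg.grammar.Grammar;
import opennlp.ccg.lexicon.*;   // Word (wildcard import, mirroring Grammar's own imports)

// Hypothetical sketch: write the words of one parsed sentence to a morph XML file.
public class MorphDump {
    public static void main(String[] args) throws java.io.IOException {
        Grammar grammar = new Grammar("grammar.xml");
        List<Word> words = new ArrayList<Word>(grammar.getParsedWords("the dog barks"));
        grammar.toMorphXml(words, "out/morph.xml");   // one <entry .../> element per word
    }
}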
* @throws IOException */ public void toLexiconXml(List cats, List POSs, String filename) throws IOException { // create map from supertags with unique suffixes to cat/pos pairs Map> stagMap = new HashMap>(); for (int i=0; i < cats.size(); i++) { Category cat = cats.get(i); String pos = POSs.get(i); String stag = cat.getSupertag(); if (stagMap.containsKey(stag)) { int j = 1; while (stagMap.containsKey(stag+"-"+j)) j++; stag += "-"+j; } stagMap.put(stag, new Pair(cat, pos)); } List keys = new ArrayList(stagMap.keySet()); Collections.sort(keys); XMLOutputter xout = new XMLOutputter(); xout.setFormat(Format.getPrettyFormat()); PrintWriter out = new PrintWriter(new BufferedWriter(new FileWriter(filename))); out.println(""); out.println(""); for (String key : keys) { Pair p = stagMap.get(key); Category cat = p.a; String pos = p.b; Element fam = new Element("family"); fam.setAttribute("name", key); fam.setAttribute("pos", pos); Element ent = new Element("entry"); ent.setAttribute("name", "1"); fam.addContent(ent); ent.addContent(cat.toXml()); xout.output(fam, out); out.println(); } out.println(""); out.flush(); out.close(); } } ================================================ FILE: src/opennlp/ccg/grammar/Rule.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003 Jason Baldridge, Gann Bierner and // University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.grammar; import opennlp.ccg.synsem.*; import opennlp.ccg.unify.*; import java.util.*; import org.jdom.Element; /** * Interface for categorial rules. * * @author Gann Bierner * @author Jason Baldridge * @author Michael White * @version $Revision: 1.5 $, $Date: 2009/11/30 20:36:15 $ */ public interface Rule { /** * Apply this rule to some input categories. * * @param inputs the input categories to try to combine * @return the Category (or categories) resulting from using this Rule to combine the * inputs * @exception UnifyFailure if the inputs cannot be combined by this Rule **/ public List applyRule(Category[] inputs) throws UnifyFailure; /** * The number of arguments this rule takes. For example, the arity of the * forward application rule of categorial grammar (X/Y Y => Y) is 2. * * @return the number of arguments this rule takes **/ public int arity(); /** * Returns the interned name of this rule. */ public String name(); /** * Returns the rule group which contains this rule. */ public RuleGroup getRuleGroup(); /** * Sets this rule's rule group. */ public void setRuleGroup(RuleGroup ruleGroup); /** Returns an XML element representing the rule. 
*/ public Element toXml(); } ================================================ FILE: src/opennlp/ccg/grammar/RuleGroup.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-6 Jason Baldridge, Gann Bierner and // Michael White (University of Edinburgh, The Ohio State University) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.grammar; import opennlp.ccg.synsem.*; import opennlp.ccg.hylo.*; import opennlp.ccg.unify.*; import opennlp.ccg.util.*; import org.jdom.*; import org.jdom.output.*; import gnu.trove.*; import java.io.*; import java.net.*; import java.util.*; /** * A set of rules for combining categories. * Observed rule combos can be cached, either statically or dynamically. * * During deserialization, the grammar is set to the current grammar, * and supercat rule combos are borrowed from the current grammar's rule group. * * @author Jason Baldridge * @author Gann Bierner * @author Michael White * @version $Revision: 1.32 $, $Date: 2011/06/07 05:12:01 $ */ public class RuleGroup implements Serializable { private static final long serialVersionUID = -6240266013357142289L; /** The grammar that this rule group is part of. */ public transient Grammar grammar; // rules private List unaryRules = new ArrayList(); private List binaryRules = new ArrayList(); // maps of type changing rules by their semantics private GroupMap predsToRules = new GroupMap(); private GroupMap relsToRules = new GroupMap(); // rule for use in applying coarticulations private BackwardApplication bapp = new BackwardApplication(); // glue rule private GlueRule glueRule = new GlueRule(); // supercat-rule combos, to support filtering on observed ones private class SupercatRuleCombo { // NB: strings must be interned private String supercat; private String supercat2; private String rule; // unary rule constructor public SupercatRuleCombo(String supercat, String rule) { setCombo(supercat.intern(), (rule != null) ? rule.intern() : null); } // binary rule constructor public SupercatRuleCombo(String supercat, String supercat2, String rule) { setCombo(supercat.intern(), supercat2.intern(), (rule != null) ? rule.intern() : null); } // setters // NB: assume interned strings! 
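The combo keys above are interned precisely so that the identity-based hashCode and == comparisons in the methods below behave like content comparisons. A tiny, library-independent illustration of that invariant:

// Interned strings share one canonical instance, so == (and identityHashCode)
// agrees with content equality -- the invariant the combo lookups rely on.
public class InternDemo {
    public static void main(String[] args) {
        String a = "s\\np".intern();
        String b = new String("s\\np").intern();
        System.out.println(a == b);   // true: same canonical instance
    }
}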
public void setCombo(String supercat, String rule) { this.supercat = supercat; this.supercat2 = null; this.rule = rule; } public void setCombo(String supercat, String supercat2, String rule) { this.supercat = supercat; this.supercat2 = supercat2; this.rule = rule; } // hashcode public int hashCode() { return 31*System.identityHashCode(supercat) + 17*System.identityHashCode(rule) + System.identityHashCode(supercat2); } // equals public boolean equals(Object obj) { if (!(obj instanceof SupercatRuleCombo)) return false; SupercatRuleCombo combo = (SupercatRuleCombo) obj; return supercat == combo.supercat && supercat2 == combo.supercat2 && rule == combo.rule; } // supercat hashcode, excluding rule public int supercatHashCode() { return 31*System.identityHashCode(supercat) + System.identityHashCode(supercat2); } // supercat equals public boolean supercatEquals(Object obj) { if (!(obj instanceof SupercatRuleCombo)) return false; SupercatRuleCombo combo = (SupercatRuleCombo) obj; return supercat == combo.supercat && supercat2 == combo.supercat2; } // toString public String toString() { StringBuffer sb = new StringBuffer(supercat); if (supercat2 != null) sb.append(' ').append(supercat2); sb.append(' ').append(rule); return sb.toString(); } } // class for seen combos when determined dynamically // nb: for space efficiency, allows representative to be retrieved from set private static class SupercatComboSet extends THashSet { private static final long serialVersionUID = 1L; SupercatComboSet() { super( new TObjectHashingStrategy() { private static final long serialVersionUID = 1L; public int computeHashCode(Object o) { return (o instanceof SupercatRuleCombo) ? ((SupercatRuleCombo)o).supercatHashCode() : 0; } public boolean equals(Object o1, Object o2) { return (o1 instanceof SupercatRuleCombo) ? ((SupercatRuleCombo)o1).supercatEquals(o2) : false; } } ); } // return the seen combo, or null if none SupercatRuleCombo get(SupercatRuleCombo combo) { int index = index(combo); if (index < 0) return null; return (SupercatRuleCombo) this._set[index]; } } // observed supercat-rule combos private transient Set supercatRuleCombos = null; // observed supercat combos (for which complete rule combos are known) private transient SupercatComboSet supercatCombosSeen = null; // reusable combo for checking presence private transient SupercatRuleCombo combo = new SupercatRuleCombo("dummy", "dummy"); // flag for whether observed supercat combos is determined dynamically private boolean dynamicCombos = false; /** * Constructs an empty rule group for the given grammar. */ public RuleGroup(Grammar grammar) { this.grammar = grammar; bapp.setRuleGroup(this); } /** * Constructs a rule group from the given URL, for * the given grammar. 
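A rule group is normally read from a rules file via the URL-based constructor nearby, but it can also be assembled programmatically with addRule, which sorts rules into the unary or binary list by arity. A hypothetical sketch:

import opennlp.ccg.grammar.*;

// Hypothetical sketch: build a small rule group in code rather than from rules.xml.
public class ManualRules {
    public static void main(String[] args) throws java.io.IOException {
        Grammar grammar = new Grammar("grammar.xml");            // assumed path
        RuleGroup rg = new RuleGroup(grammar);                   // empty rule group
        rg.addRule(new ForwardApplication());                    // arity 2 -> binary rules
        rg.addRule(new BackwardApplication());
        rg.addRule(new ForwardTypeRaising(false, null, null));   // arity 1 -> unary rules
        System.out.println(rg.getBinaryRules().size() + " binary, "
                           + rg.getUnaryRules().size() + " unary");
    }
}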
*/ public RuleGroup(URL url, Grammar grammar) throws IOException { this.grammar = grammar; bapp.setRuleGroup(this); XmlScanner ruleScanner = new XmlScanner() { public void handleElement(Element ruleEl) { String active = ruleEl.getAttributeValue("active"); if (active == null || active.equals("true")) { try { addRule(readRule(ruleEl)); } catch (RuntimeException exc) { System.err.println("Skipping rule: " + ruleEl.getAttributeValue("name")); System.err.println(exc.toString()); } } } }; ruleScanner.parse(url); } // during deserialization, sets grammar to the current grammar private void readObject(java.io.ObjectInputStream in) throws IOException, ClassNotFoundException { in.defaultReadObject(); grammar = Grammar.theGrammar; borrowSupercatRuleCombos(grammar.rules); } // reads in a rule private Rule readRule(Element ruleEl) { Rule r; String type = ruleEl.getName(); if (type.equals("application")) { String dir = ruleEl.getAttributeValue("dir"); if (dir.equals("forward")) { r = new ForwardApplication(); } else { r = new BackwardApplication(); } } else if (type.equals("composition")) { String dir = ruleEl.getAttributeValue("dir"); String harmonic = ruleEl.getAttributeValue("harmonic"); boolean isHarmonic = new Boolean(harmonic).booleanValue(); if (dir.equals("forward")) { r = new ForwardComposition(isHarmonic); } else { r = new BackwardComposition(isHarmonic); } } else if (type.equals("substitution")) { String dir = ruleEl.getAttributeValue("dir"); String harmonic = ruleEl.getAttributeValue("harmonic"); boolean isHarmonic = new Boolean(harmonic).booleanValue(); if (dir.equals("forward")) { r = new ForwardSubstitution(isHarmonic); } else { r = new BackwardSubstitution(isHarmonic); } } else if (type.equals("typeraising")) { String dir = ruleEl.getAttributeValue("dir"); String useDollar = ruleEl.getAttributeValue("useDollar"); boolean addDollar = new Boolean(useDollar).booleanValue(); Category arg = null; Element argElt = ruleEl.getChild("arg"); if (argElt != null) { arg = CatReader.getCat((Element)argElt.getChildren().get(0)); } Category result = null; Element resultElt = ruleEl.getChild("result"); if (resultElt != null) { result = CatReader.getCat((Element)resultElt.getChildren().get(0)); } if (dir.equals("forward")) { r = new ForwardTypeRaising(addDollar, arg, result); } else { r = new BackwardTypeRaising(addDollar, arg, result); } } else if (type.equals("typechanging")) { r = readTypeChangingRule(ruleEl); } else { throw new RuntimeException("Invalid element in rules: " + type); } return r; } // reads in a type changing rule private Rule readTypeChangingRule(Element ruleEl) { String rname = ruleEl.getAttributeValue("name"); Element argCatElt = (Element)ruleEl.getChild("arg").getChildren().get(0); Category arg = CatReader.getCat(argCatElt); Element resultCatElt = (Element)ruleEl.getChild("result").getChildren().get(0); Element lfElt = resultCatElt.getChild("lf"); Category result = CatReader.getCat(resultCatElt); LF firstEP = null; if (lfElt != null) { firstEP = HyloHelper.firstEP(HyloHelper.getLF(lfElt)); } grammar.lexicon.propagateTypes(result, arg); grammar.lexicon.propagateDistributiveAttrs(result, arg); grammar.lexicon.expandInheritsFrom(result, arg); return new TypeChangingRule(arg, result, rname, firstEP); } /** * Writes the rules to an XML file with the given name. 
* @throws IOException */ public void toXml(String filename) throws IOException { XMLOutputter xout = new XMLOutputter(); xout.setFormat(Format.getPrettyFormat()); PrintWriter out = new PrintWriter(new BufferedWriter(new FileWriter(filename))); out.println(""); out.println(""); for (Rule r : binaryRules) { xout.output(r.toXml(), out); out.println(); } for (Rule r : unaryRules) { xout.output(r.toXml(), out); out.println(); } out.println(""); out.flush(); out.close(); } /** * Sets the dynamic combos flag to the given value, controlling whether the * observed supercat combos is determined dynamically. */ public void setDynamicCombos(boolean dynamic) { this.dynamicCombos = dynamic; if (!dynamicCombos) supercatCombosSeen = null; else if (dynamicCombos) { if (supercatCombosSeen == null) supercatCombosSeen = new SupercatComboSet(); if (supercatRuleCombos == null) supercatRuleCombos = new HashSet(); } } /** * Returns the dynamic combos flag. */ public boolean getDynamicCombos() { return dynamicCombos; } /** * Loads the observed supercat-rule combos, for filtering. * Only file URLs are supported at present. * Missing files are ignored. **/ public void loadSupercatRuleCombos(URL url) throws IOException { supercatRuleCombos = new HashSet(); File combosFile = new File(url.getFile()); if (!combosFile.exists()) return; System.out.println("Loading supercat combos from " + url.getFile()); BufferedReader in = new BufferedReader(new FileReader(combosFile)); String line; while ((line = in.readLine()) != null) { String[] tokens = line.split("\\s"); if (tokens.length < 2) { System.err.println("Warning: skipping supercat-rule combo with fewer than two tokens: " + line); continue; } if (tokens.length == 2) { supercatRuleCombos.add(new SupercatRuleCombo(tokens[0], tokens[1])); } else { if (tokens.length > 3) { System.err.println("Warning: ignoring extra tokens (beyond 3rd) in supercat-rule combo: " + line); } supercatRuleCombos.add(new SupercatRuleCombo(tokens[0], tokens[1], tokens[2])); } } in.close(); } /** Borrows the observed supercat-rule combos from the given rule group. */ public void borrowSupercatRuleCombos(RuleGroup ruleGroup) { supercatRuleCombos = ruleGroup.supercatRuleCombos; supercatCombosSeen = ruleGroup.supercatCombosSeen; } /** Adds the given rule. */ public void addRule(Rule r) { r.setRuleGroup(this); if (r instanceof TypeChangingRule) { unaryRules.add(r); index((TypeChangingRule)r); } else if (r.arity() == 1) { unaryRules.add(r); } else if (r.arity() == 2) { binaryRules.add(r); } else { // shouldn't happen throw new RuntimeException("Can't determine arity of rule: " + r); } } // indexes type changing rules by preds and rels private void index(TypeChangingRule rule) { LF firstEP = rule.getFirstEP(); if (firstEP == null) { return; } String pred = HyloHelper.getLexPred(firstEP); if (pred != null) { predsToRules.put(pred, rule); return; } String rel = HyloHelper.getRel(firstEP); if (rel != null) { relsToRules.put(rel, rule); } } /** Returns the unary rules. */ public List getUnaryRules() { return unaryRules; } /** Returns the binary rules. */ public List getBinaryRules() { return binaryRules; } /** Returns the type changing rule with the given name, or null if none. 
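 *
 * A lookup-and-apply sketch (the rule name "n2np" is made up for illustration;
 * TypeChangingRule.applyRule may throw UnifyFailure):
 * <pre>
 *   TypeChangingRule tcr = ruleGroup.getTypeChangingRule("n2np");
 *   if (tcr != null) {
 *       List results = tcr.applyRule(new Category[] { inputCat });
 *   }
 * </pre>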
*/ public TypeChangingRule getTypeChangingRule(String name) { for (Iterator it = unaryRules.iterator(); it.hasNext(); ) { Object rule = it.next(); if (rule instanceof TypeChangingRule) { TypeChangingRule tcr = (TypeChangingRule) rule; if (tcr.name().equals(name)) return tcr; } } return null; } /** * Returns the type changing rules indexed by the given lexical predicate. * The type changing rules are indexed by their first elementary predication. */ public Collection getRulesForPred(String pred) { return predsToRules.get(pred); } /** * Returns the type changing rules indexed by the given relation. * The type changing rules are indexed by their first elementary predication. */ public Collection getRulesForRel(String rel) { return relsToRules.get(rel); } /** Applies the unary rules to the given input sign, returning the list of results. */ public List applyUnaryRules(Sign input) { Sign[] inputs = { input }; List results = new ArrayList(2); String supertag = input.getCategory().getSupertag(); // check whether dynamic combos update required, or whether rules can be skipped boolean dynamicCombosUpdate = false; boolean skip = false; if (dynamicCombos) { combo.setCombo(supertag, null); SupercatRuleCombo rep = supercatCombosSeen.get(combo); if (rep == null) dynamicCombosUpdate = true; else if (rep.rule == null) skip = true; } // skip if possible if (skip) return results; // try each rule for (Rule r : unaryRules) { // filter on observed supercat-rule combos, if any, if not updating if (!dynamicCombosUpdate && supercatRuleCombos != null) { combo.setCombo(supertag, r.name()); if (!supercatRuleCombos.contains(combo)) { continue; } } // if updating combos, apply rule and record results if (dynamicCombosUpdate) { int prevsize = results.size(); ((AbstractRule)r).applyRule(inputs, results); // update upon success if (results.size() > prevsize) { SupercatRuleCombo newCombo = null; combo.setCombo(supertag, r.name()); if (!supercatRuleCombos.contains(combo)) { newCombo = new SupercatRuleCombo(supertag, r.name()); supercatRuleCombos.add(newCombo); } if (!supercatCombosSeen.contains(combo)) { if (newCombo == null) newCombo = new SupercatRuleCombo(supertag, r.name()); supercatCombosSeen.add(newCombo); } } } // otherwise just apply rule else ((AbstractRule)r).applyRule(inputs, results); } // if updating combos and none succeeded, add one with null rule if (dynamicCombosUpdate) { combo.setCombo(supertag, null); if (!supercatCombosSeen.contains(combo)) { SupercatRuleCombo newCombo = new SupercatRuleCombo(supertag, null); supercatCombosSeen.add(newCombo); } } // done return results; } /** Applies the binary rules to the given input signs, returning the list of results. 
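 *
 * A minimal usage sketch (illustrative only; the two input Signs are assumed to come from
 * elsewhere, e.g. lexical lookup or earlier chart entries):
 * <pre>
 *   rules.setDynamicCombos(true);                  // optionally cache observed combos on the fly
 *   List results = rules.applyBinaryRules(left, right);
 *   for (Object obj : results) {
 *       Sign derived = (Sign) obj;                 // each result is a derived Sign
 *   }
 * </pre>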
*/ public List applyBinaryRules(Sign input1, Sign input2) { Sign[] inputs = { input1, input2 }; List results = new ArrayList(2); String supertag1 = input1.getCategory().getSupertag(); String supertag2 = input2.getCategory().getSupertag(); // check whether dynamic combos update required, or whether rules can be skipped boolean dynamicCombosUpdate = false; boolean skip = false; if (dynamicCombos) { combo.setCombo(supertag1, supertag2, null); SupercatRuleCombo rep = supercatCombosSeen.get(combo); if (rep == null) dynamicCombosUpdate = true; else if (rep.rule == null) skip = true; } // skip if possible if (skip) return results; // try each rule for (Rule r : binaryRules) { // filter on observed supercat-rule combos, if any, if not updating if (!dynamicCombosUpdate && supercatRuleCombos != null) { combo.setCombo(supertag1, supertag2, r.name()); if (!supercatRuleCombos.contains(combo)) { continue; } } // if updating combos, apply rule and record results if (dynamicCombosUpdate) { int prevsize = results.size(); ((AbstractRule)r).applyRule(inputs, results); // update upon success if (results.size() > prevsize) { SupercatRuleCombo newCombo = null; combo.setCombo(supertag1, supertag2, r.name()); if (!supercatRuleCombos.contains(combo)) { newCombo = new SupercatRuleCombo(supertag1, supertag2, r.name()); supercatRuleCombos.add(newCombo); } if (!supercatCombosSeen.contains(combo)) { if (newCombo == null) newCombo = new SupercatRuleCombo(supertag1, supertag2, r.name()); supercatCombosSeen.add(newCombo); } } } // otherwise just apply rule else ((AbstractRule)r).applyRule(inputs, results); } // if updating combos and none succeeded, add one with null rule if (dynamicCombosUpdate) { combo.setCombo(supertag1, supertag2, null); if (!supercatCombosSeen.contains(combo)) { SupercatRuleCombo newCombo = new SupercatRuleCombo(supertag1, supertag2, null); supercatCombosSeen.add(newCombo); } } // done return results; } /** Applies the glue rule to the given input signs, returning the list of results. */ public List applyGlueRule(Sign input1, Sign input2) { Sign[] inputs = { input1, input2 }; List results = new ArrayList(1); glueRule.applyRule(inputs, results); return results; } /** Applies the coarticulation to the given sign, adding the result (if any) to the given ones. */ public void applyCoart(Sign lexSign, Sign coartSign, List results) { Category[] cats = new Category[] { lexSign.getCategory(), coartSign.getCategory() }; try { List resultCats = bapp.applyRule(cats); if (resultCats.isEmpty()) return; for (Iterator it = resultCats.iterator(); it.hasNext();) { Category catResult = it.next(); bapp.distributeTargetFeatures(catResult); Sign sign = Sign.createCoartSign(catResult, lexSign, coartSign); results.add(sign); } } catch (UnifyFailure uf) {} } } ================================================ FILE: src/opennlp/ccg/grammar/TypeChangingRule.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-4 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. 
See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.grammar; import opennlp.ccg.unify.*; import opennlp.ccg.hylo.HyloHelper; import opennlp.ccg.synsem.*; import java.util.*; import org.jdom.Element; /** * A CCG unary type changing rule. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.12 $, $Date: 2009/11/30 20:36:16 $ **/ public class TypeChangingRule extends AbstractRule implements LexSemOrigin { private static final long serialVersionUID = -2654945192870162776L; /** * String used as the POS for all type changing rules, * to satisfy the LexSemOrigin interface. * Defaults to "URULE". */ public static String POS_STRING = "URULE"; /** The argument category. */ protected Category _arg; /** The result category. */ protected Category _result; /** The first elementary predication in the result LF (or null), before sorting. */ protected LF _firstEP; /** Constructor. */ public TypeChangingRule(Category arg, Category result, String name, LF firstEP) { _arg = arg; _result = result; _name = name.intern(); _firstEP = firstEP; setOrigin(); } /** Returns an XML element representing the rule. */ public Element toXml() { Element retval = new Element("typechanging"); retval.setAttribute("name", _name); Element argElt = new Element("arg"); retval.addContent(argElt); argElt.addContent(_arg.toXml()); Element resultElt = new Element("result"); retval.addContent(resultElt); resultElt.addContent(_result.toXml()); return retval; } /** Returns 1. */ public int arity() { return 1; } /** Returns the arg. */ public Category getArg() { return _arg; } /** Returns the result. */ public Category getResult() { return _result; } /** Returns the first elementary predication in the result LF (or null), before sorting. */ public LF getFirstEP() { return _firstEP; } /** Applies this rule to the given inputs. */ public List applyRule(Category[] inputs) throws UnifyFailure { // check arity if (inputs.length != 1) { throw new UnifyFailure(); } return apply(inputs[0]); } /** Applies this rule to the given input. */ protected List apply(Category input) throws UnifyFailure { // unify quick check _arg.unifyCheck(input); // copy arg and result Category arg = _arg.copy(); Category result = _result.copy(); // make variables unique UnifyControl.reindex(result, arg); // unify Substitution sub = new GSubstitution(); GUnifier.unify(input, arg, sub); ((GSubstitution)sub).condense(); // fill in result Category $result = (Category)result.fill(sub); appendLFs(input, result, $result, sub); // return List results = new ArrayList(1); _headCats.clear(); results.add($result); _headCats.add(input); return results; } /** Returns 'name: arg => result'. */ public String toString() { StringBuffer sb = new StringBuffer(); sb.append(_name).append(": "); sb.append(_arg).append(' '); sb.append("=> ").append(_result); return sb.toString(); } /** Returns 'arg_=>_result' as the supertag. */ public String getSupertag() { StringBuffer sb = new StringBuffer(); sb.append(_arg.getSupertag()).append("_=>_").append(_result.getSupertag()); return sb.toString(); } /** * Always returns POS_STRING. */ public String getPOS() { return POS_STRING; } /** * Sets the origin of the elementary predications. 
*/ public void setOrigin() { HyloHelper.setOrigin(_result.getLF(), this); } } ================================================ FILE: src/opennlp/ccg/grammar/Types.java ================================================ /////////////////////////////////////////////////////////////////////////////// //// Copyright (C) 2003-4 Gunes Erkan and University of Edinburgh (Michael White) //// //// This library is free software; you can redistribute it and/or //// modify it under the terms of the GNU Lesser General Public //// License as published by the Free Software Foundation; either //// version 2.1 of the License, or (at your option) any later version. //// //// This library is distributed in the hope that it will be useful, //// but WITHOUT ANY WARRANTY; without even the implied warranty of //// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the //// GNU Lesser General Public License for more details. //// //// You should have received a copy of the GNU Lesser General Public //// License along with this program; if not, write to the Free Software //// Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. //////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.grammar; import opennlp.ccg.util.*; import opennlp.ccg.unify.*; import org.jdom.*; import org.jdom.input.*; import java.io.*; import java.net.*; import java.util.*; import gnu.trove.*; /** * Class for constructing and holding the hierarchical simple type maps. * * @author Gunes Erkan * @author Michael White * @version $Revision: 1.13 $, $Date: 2009/12/21 03:27:18 $ */ public class Types { public final Grammar grammar; private final HashMap nameToType = new HashMap(); private final ArrayList indexToType = new ArrayList(); private int maxTypeIndex = 0; public static final String TOP_TYPE = "top"; public static final String BOT_TYPE = "bottom"; /** Constructor for an empty hierarchy (with just the top type). */ public Types(Grammar grammar) { getSimpleType(TOP_TYPE); this.grammar = grammar; } /** * Constructs the type hierarchy from the given URL, for * the given grammar. */ @SuppressWarnings("unchecked") public Types(URL url, Grammar grammar) throws IOException { this.grammar = grammar; SAXBuilder builder = new SAXBuilder(); Document doc; try { doc = builder.build(url); } catch (JDOMException exc) { getSimpleType(TOP_TYPE); throw (IOException) new IOException().initCause(exc); } List entries = doc.getRootElement().getChildren(); readTypes(entries); // for debugging: print the indexToType list //printTypes(); } /** Returns the simple type with the given name, or a new one if none yet exists. */ public SimpleType getSimpleType(String typeName) { SimpleType type = nameToType.get(typeName); if (type == null) { BitSet bs = new BitSet(); bs.set(maxTypeIndex); SimpleType newtype = new SimpleType(maxTypeIndex, typeName, bs, this); nameToType.put(typeName, newtype); indexToType.add(newtype); nameToType.get(TOP_TYPE).getBitSet().set(maxTypeIndex++); return newtype; } else return type; } /** Returns whether there is a simple type with the given name. */ public boolean containsSimpleType(String typeName) { return nameToType.containsKey(typeName); } /** Returns the list of types, with parents preceding children in the hierarchy. */ public ArrayList getIndexMap() { return indexToType; } /** Reads the rules and constructs the nameToType and indexToType maps. 
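 *
 * Each child element is expected to carry a "name" attribute and, optionally, a
 * whitespace-separated "parents" attribute; a type with no parents is attached directly
 * under the top type. A minimal usage sketch against the public API (the URL and the type
 * names are illustrative):
 * <pre>
 *   Types types = new Types(typesUrl, grammar);
 *   SimpleType animType = types.getSimpleType("animate-being");
 *   boolean known = types.containsSimpleType("sem-obj");
 * </pre>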
*/ private void readTypes(List _types) { GroupMap hierarchy = new GroupMap(); // map from types to all subtypes GroupMap parents = new GroupMap(); // map from types to parents TObjectIntHashMap depthMap = new TObjectIntHashMap(); // map from types to max depth // Construct the initial hierarchy of types without // taking transitive closure. // Also store parents. for (int i=0; i < _types.size(); i++) { Element typeEl = _types.get(i); String typeName = typeEl.getAttributeValue("name"); String _parents = typeEl.getAttributeValue("parents"); hierarchy.put(typeName, BOT_TYPE); if (_parents == null) { hierarchy.put(TOP_TYPE, typeName); parents.put(typeName, TOP_TYPE); } else { String[] parentsArray = _parents.split("\\s+"); for (int j = 0; j < parentsArray.length; j++) { hierarchy.put(parentsArray[j], typeName); parents.put(typeName, parentsArray[j]); } } } // Compute depth from parents. for (String type : parents.keySet()) { int depth = computeDepth(type, parents, type); depthMap.put(type, depth); } // Compute ALL subtypes of each type and insert into the hierarchy. for (String type : hierarchy.keySet()) { hierarchy.putAll(type, findAllSubtypes(hierarchy, type)); } // Assign a unique int to each type in breadth-first order. // Then create the string -> SimpleType map. createSimpleTypes(hierarchy, depthMap); } /** Returns the max depth of the given type, checking for cycles. */ private static int computeDepth(String type, GroupMap parents, String startType) { if (type.equals(TOP_TYPE)) return 0; int maxParentDepth = 0; Set parentSet = parents.get(type); if (parentSet != null) { for (String parent : parentSet) { if (parent.equals(startType)) { throw new RuntimeException("Error, type hierarchy contains cycle from/to: " + startType); } int parentDepth = computeDepth(parent, parents, startType); maxParentDepth = Math.max(maxParentDepth, parentDepth); } } return maxParentDepth + 1; } /** * Computes the list of all sub-types of a given type (key) * in depth-first order. */ private Collection findAllSubtypes(GroupMap hierarchy, String key) { ArrayList subs = new ArrayList(); if (hierarchy.get(key) != null) { Stack look = new Stack(); for (String type : hierarchy.get(key)) { look.push(type); } for (; !look.empty() ; ) { String new_sub = look.pop(); subs.add(new_sub); if (hierarchy.get(new_sub) != null) { for (String type : hierarchy.get(new_sub)) { look.push(type); } } } } return subs; } /** * Creates the SimpleType objects and constructs the nameToType and indexToType maps. 
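 *
 * Types are assigned indices in order of increasing depth in the hierarchy (ties broken
 * alphabetically), with the top type at index 0; each type's BitSet then has its own index
 * set along with the index of every one of its subtypes, so subtype relationships can be
 * checked with bit operations on these sets.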
*/ private void createSimpleTypes(GroupMap hierarchy, TObjectIntHashMap depthMap) { // find max depth int maxDepth = 0; int[] depths = depthMap.getValues(); for (int i = 0; i < depths.length; i++) { maxDepth = Math.max(maxDepth, depths[i]); } // add types in order of increasing depth ArrayList typesVisited = new ArrayList(); typesVisited.add(TOP_TYPE); Object[] types = depthMap.keys(); ArrayList typesAtSameDepth = new ArrayList(); for (int i = 1; i <= maxDepth; i++) { typesAtSameDepth.clear(); for (int j = 0; j < types.length; j++) { if (depthMap.get(types[j]) == i) typesAtSameDepth.add((String)types[j]); } Collections.sort(typesAtSameDepth); typesVisited.addAll(typesAtSameDepth); } // construct the maps for (int i=0; i < typesVisited.size(); i++) { String typeName = typesVisited.get(i); BitSet bitset = new BitSet(); bitset.set(i); if (hierarchy.get(typeName) != null) { for (String type : hierarchy.get(typeName)) { int indexToSet = typesVisited.indexOf(type); if (indexToSet != -1) bitset.set(indexToSet); } } SimpleType st = new SimpleType(i, typeName, bitset, this); nameToType.put(typeName, st); indexToType.add(st); } maxTypeIndex = typesVisited.size(); } /** * Prints the types and their subtypes to System.out. */ public void printTypes() { System.out.println("types:"); for (int i=0; i < indexToType.size(); i++) { SimpleType st = indexToType.get(i); System.out.println(i + ": " + st.getName() + " subtypes: " + st.getBitSet()); } System.out.println(); } /** Tests serialization of simple types, including resolution. */ public void debugSerialization() throws IOException, ClassNotFoundException { // test serialization SimpleType st = indexToType.get(1); String filename = "tmp.ser"; ObjectOutputStream out = new ObjectOutputStream(new FileOutputStream(filename)); System.out.println("Writing st: " + st.getIndex() + ": " + st + " " + st.getBitSet()); out.writeObject(st); out.close(); ObjectInputStream in = new ObjectInputStream(new FileInputStream(filename)); System.out.print("Reading st2: "); SimpleType st2 = (SimpleType) in.readObject(); System.out.println(st2.getIndex() + ": " + st2 + " " + st2.getBitSet()); in.close(); // test identity (and thus readResolve) System.out.println("st == st2?: " + (st == st2)); } } ================================================ FILE: src/opennlp/ccg/grammar/to-apml.xsl ================================================ ' n't Hstar Lstar LplusHstar LstarplusH HstarplusL HplusLstar aamm ppmm ================================================ FILE: src/opennlp/ccg/grammardoc/AbstractDocumenter.java ================================================ /* * $Id: AbstractDocumenter.java,v 1.2 2006/11/01 02:53:20 coffeeblack Exp $ */ package opennlp.ccg.grammardoc; /** * Convenience base class for documenters to extend * * @author Scott Martin (http://www.ling.osu.edu/~scott/) * @version $Revision: 1.2 $ */ public abstract class AbstractDocumenter implements Documenter { protected DocumenterContext documenterContext; protected String name; /** * Default constructor. All documenters must have a no-argument constructor. */ protected AbstractDocumenter() {} /** * Creates a new documenter with the specified name. */ protected AbstractDocumenter(String name) { this.name = name; } /** * Sets this documenter's context. */ public void setDocumenterContext(DocumenterContext documenterContext) { this.documenterContext = documenterContext; } /** * Gets this documenter's name. 
*/ public String getName() { return name; } } ================================================ FILE: src/opennlp/ccg/grammardoc/Documenter.java ================================================ /* * $Id: Documenter.java,v 1.2 2006/11/01 02:53:20 coffeeblack Exp $ */ package opennlp.ccg.grammardoc; /** * A documenter that produces documentation for an OpenCCG grammar. * * @author Scott Martin (http://www.ling.osu.edu/~scott/) * @version $Revision: 1.2 $ */ public interface Documenter { /** * Gets the name of this documenter. * * @return A string like SGML Documenter. */ public String getName(); /** * Sets this documenter's context. * * @param documenterContext The context this documenter should use. */ public void setDocumenterContext(DocumenterContext documenterContext); /** * Causes a documenter to produce documentation for the provided grammar. * Before any calls to this method are made, the documenter will first be * configured with a (single) call to * {@link #setDocumenterContext(DocumenterContext)}. * * @param grammar The grammar to document. * @throws DocumenterException If any problems occur during the process of * generating documentation. */ public void document(SourceGrammar grammar) throws DocumenterException; } ================================================ FILE: src/opennlp/ccg/grammardoc/DocumenterContext.java ================================================ /* * $Id: DocumenterContext.java,v 1.2 2006/11/01 02:53:20 coffeeblack Exp $ */ package opennlp.ccg.grammardoc; import java.io.File; /** * Provides a context inside which a {@link Documenter} will execute. This class * gives the documenter access to objects it will need to produce its * documentation. * * @author Scott Martin (http://www.ling.osu.edu/~scott/) * @version $Revision: 1.2 $ */ public interface DocumenterContext { /** * Logs a message from a documenter. */ public void log(String message); /** * Gets the target location where the documenter should generate its * documentation files. * * @return A directory that exists in a filesystem. */ public File getDestinationDirectory(); } ================================================ FILE: src/opennlp/ccg/grammardoc/DocumenterException.java ================================================ /* * $Id: DocumenterException.java,v 1.2 2006/11/01 02:53:20 coffeeblack Exp $ */ package opennlp.ccg.grammardoc; /** * An exception thrown by a {@link Documenter}. * * @author Scott Martin (http://www.ling.osu.edu/~scott/) * @version $Revision: 1.2 $ */ public class DocumenterException extends GrammarDocException { private static final long serialVersionUID = 1L; /** * Creates a new documenter exception. */ public DocumenterException() { super(); } /** * Creates a new exception with the specified message. */ public DocumenterException(String message) { super(message); } /** * Creates a new exception with the specified message and underlying cause. */ public DocumenterException(String message, Throwable cause) { super(message, cause); } /** * Creates a new exception with the specified underlying cause. */ public DocumenterException(Throwable cause) { super(cause); } } ================================================ FILE: src/opennlp/ccg/grammardoc/DocumenterFactory.java ================================================ /* * $Id: DocumenterFactory.java,v 1.4 2006/12/11 18:19:24 coffeeblack Exp $ */ package opennlp.ccg.grammardoc; import java.util.EnumMap; import java.util.Map; /** * Factory class for creating documenters based on a predefined name. 
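 *
 * A typical programmatic use (sketch only; the documenter context and source grammar are
 * assumed to be supplied by the caller, as the GrammarDoc ant task does):
 * <pre>
 *   Documenter documenter = DocumenterFactory.newInstance().newDocumenter(DocumenterName.HTML);
 *   documenter.setDocumenterContext(context);
 *   documenter.document(sourceGrammar);
 * </pre>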
* * @author Scott Martin (http://www.ling.osu.edu/~scott/) * @version $Revision: 1.4 $ */ public class DocumenterFactory { private static final Map documenters = new EnumMap(DocumenterName.class); static final DocumenterFactory documenterFactory = new DocumenterFactory(); private DocumenterFactory() {} /** * Gets a new documenter factory. */ public static DocumenterFactory newInstance() { return documenterFactory; } /** * Gets a new instance of the default documenter. * * @return Calls {@link #newDocumenter(DocumenterName)} with * {@link DocumenterName#DEFAULT} as its argument. * @throws DocumenterNotFoundException Does not throw this exception. This * is included for binary compatibility with * {@link #newDocumenter(DocumenterName)}. */ public Documenter newDocumenter() throws DocumenterNotFoundException { return newDocumenter(DocumenterName.DEFAULT); } /** * Gets a new instance of the named documenter. * * @param name Used to look up the documenter {@link DocumenterName name}. * @return A documenter that corresponds to the specified name. * @throws DocumenterNotFoundException If no documenter can be created for * the specified name. */ public Documenter newDocumenter(String name) throws DocumenterNotFoundException { try { DocumenterName nm = DocumenterName.valueOf(name); return newDocumenter(nm); } catch(IllegalArgumentException iae) { throw new DocumenterNotFoundException(name); } } /** * Gets a new instance of the named documenter. * * @param name The {@link DocumenterName name} of the documenter to create. * @return A documenter that corresponds to the specified name. * @throws DocumenterNotFoundException If no documenter can be created for * the specified name. */ public synchronized Documenter newDocumenter(DocumenterName name) throws DocumenterNotFoundException { Documenter d = documenters.get(name); if(d == null) { try { d = name.documenterClass.newInstance(); } catch(InstantiationException ie) { throw new DocumenterNotFoundException(name, ie); } catch(IllegalAccessException iae) { throw new DocumenterNotFoundException(name, iae); } documenters.put(name, d); } return d; } } ================================================ FILE: src/opennlp/ccg/grammardoc/DocumenterName.java ================================================ /* * $Id: DocumenterName.java,v 1.3 2006/12/11 18:19:24 coffeeblack Exp $ */ package opennlp.ccg.grammardoc; import opennlp.ccg.grammardoc.html.HTMLDocumenter; /** * The known documenters that the {@link DocumenterFactory documenter factory} * is aware of. Calling {@link DocumenterFactory#newDocumenter(DocumenterName)} * with any of these values will return a valid documenter without throwing an * exception. * * @author Scott Martin (http://www.ling.osu.edu/~scott/) * @version $Revision: 1.3 $ */ public enum DocumenterName { /** * The default documenter. */ DEFAULT(HTMLDocumenter.class), /** * A documenter that produces HTML output. */ HTML(HTMLDocumenter.class); Class documenterClass; private DocumenterName(Class documenterClass) { this.documenterClass = documenterClass; } } ================================================ FILE: src/opennlp/ccg/grammardoc/DocumenterNotFoundException.java ================================================ /* * $Id: DocumenterNotFoundException.java,v 1.3 2006/12/11 18:19:24 coffeeblack Exp $ */ package opennlp.ccg.grammardoc; /** * Signals that no documenter could be found for a given name. 
* * @author Scott Martin (http://www.ling.osu.edu/~scott/) * @version $Revision: 1.3 $ */ public class DocumenterNotFoundException extends DocumenterException { private static final long serialVersionUID = 1L; /** * Creates a new exception indicating that a documenter with the specified * name was not found. */ public DocumenterNotFoundException(DocumenterName name) { this(name.name()); } /** * Creates a new exception indicating that a documenter with the specified * name was not found. */ public DocumenterNotFoundException(String name) { super(name); } /** * Creates a new exception indicating that a documenter with the specified * name was not found for the specified underlying reason. */ DocumenterNotFoundException(DocumenterName name, Throwable cause) { super(name.name(), cause); } } ================================================ FILE: src/opennlp/ccg/grammardoc/DocumenterSourceException.java ================================================ /* * $Id: DocumenterSourceException.java,v 1.2 2006/11/01 02:53:20 coffeeblack Exp $ */ package opennlp.ccg.grammardoc; /** * An exception thrown by a {@link Documenter} because of a problem in the * source grammar. This exception tracks the * {@link SourceGrammarFile source grammar file} where the problem occurred. * * @author Scott Martin (http://www.ling.osu.edu/~scott/) * @version $Revision: 1.2 $ */ public class DocumenterSourceException extends DocumenterException { private static final long serialVersionUID = 1L; protected SourceGrammarFile sourceGrammarFile; /** * Creates a new exception signaling a problem in the specified source * grammar file. */ public DocumenterSourceException(SourceGrammarFile sourceGrammarFile) { this.sourceGrammarFile = sourceGrammarFile; } /** * Creates a new exception with the specified message, signaling a problem * in the specified source grammar file. */ public DocumenterSourceException(String message, SourceGrammarFile sourceGrammarFile) { super(message); this.sourceGrammarFile = sourceGrammarFile; } /** * Creates a new exception with the specified message and underlying cause, * signaling a problem in the specified source grammar file. */ public DocumenterSourceException(String message, Throwable cause, SourceGrammarFile sourceGrammarFile) { super(message, cause); this.sourceGrammarFile = sourceGrammarFile; } /** * Creates a new exception with the specified underlying cause, signaling a * problem in the specified source grammar file. */ public DocumenterSourceException(Throwable cause, SourceGrammarFile sourceGrammarFile) { super(cause); this.sourceGrammarFile = sourceGrammarFile; } /** * Gets the source grammar file where this problem occurred. 
*/ public SourceGrammarFile getSourceGrammarFile() { return sourceGrammarFile; } } ================================================ FILE: src/opennlp/ccg/grammardoc/GrammarDoc.java ================================================ /* * $Id: GrammarDoc.java,v 1.7 2007/05/30 22:53:17 coffeeblack Exp $ */ package opennlp.ccg.grammardoc; import java.io.File; import java.io.IOException; import java.io.PrintStream; import java.util.Arrays; import java.util.Iterator; import java.util.List; import javax.xml.parsers.DocumentBuilder; import javax.xml.parsers.DocumentBuilderFactory; import javax.xml.parsers.ParserConfigurationException; import org.apache.tools.ant.BuildException; import org.apache.tools.ant.Project; import org.apache.tools.ant.Target; import org.apache.tools.ant.Task; import org.w3c.dom.Document; import org.w3c.dom.NodeList; import org.xml.sax.SAXException; /** * Class that implements the grammardoc ant task. * * @author Scott Martin (http://www.ling.osu.edu/~scott/) * @version $Revision: 1.7 $ */ public class GrammarDoc extends Task implements DocumenterContext { private File srcDir, destDir; /** * Executes the grammardoc task. This method finds the specified * srcDir and destDir, then invokes a * {@link Documenter documenter} with those parameters. * * @throws BuildException If a source directory or destination directory is * not specified, or the source directory does not exist. */ @Override public void execute() throws BuildException { if(srcDir == null) { srcDir = new File(System.getProperty("user.dir")); } if(!srcDir.exists()) { throw new BuildException("Source directory does not exist"); } if(destDir == null) { destDir = new File(srcDir, "docs"); } if(!destDir.exists()) { log("Creating directory " + destDir); destDir.mkdirs(); } try { Documenter documenter = DocumenterFactory.newInstance() .newDocumenter(); log("Using " + documenter.getName()); log("Documenting " + srcDir.getAbsolutePath()); log("Generating documentation to " + destDir); documenter.setDocumenterContext(this); documenter.document(loadSourceGrammar()); log("Done"); } catch(DocumenterNotFoundException dnfe) { throw new BuildException("documenter not found: " + dnfe.getMessage(), getLocation()); } catch(DocumenterSourceException dse) { throw new BuildException("problem in source file " + dse.getSourceGrammarFile() + ": " + dse.getMessage(), getLocation()); } catch(DocumenterException de) { throw new BuildException("problem documenting: " + de.getMessage(), de); } catch(GrammarDocException gde) { throw new BuildException(gde.getMessage(), getLocation()); } } SourceGrammar loadSourceGrammar() throws GrammarDocException { SourceGrammar sourceGrammar = new SourceGrammar(srcDir); try { SourceGrammarFile grammar = loadGrammarFile( SourceGrammarFileType.GRAMMAR, new File(srcDir, SourceGrammarFileType.GRAMMAR.fileName + ".xml")); sourceGrammar.addSourceGrammarFile(SourceGrammarFileType.GRAMMAR, grammar); //TODO make these StreamSource instead File gd = grammar.sourceFile; for(SourceGrammarFileType fileType : SourceGrammarFileType.values()) { if(!fileType.equals(SourceGrammarFileType.GRAMMAR)) { // already DocumentBuilder db = DocumentBuilderFactory.newInstance() .newDocumentBuilder(); Document doc = db.parse(gd); NodeList fileEls = doc.getElementsByTagName( fileType.name().toLowerCase()); if(fileEls.getLength() == 0) { if(fileType.isRequired()) { throw new GrammarDocException( "file type required but missing: " + fileType); } } else { sourceGrammar.addSourceGrammarFile(fileType, loadGrammarFile(fileType, new File(srcDir, 
fileType.fileName + ".xml"))); } } } } catch(ParserConfigurationException pce) { throw new GrammarDocException("parser configuration problem: " + pce.getMessage(), pce); } catch(SAXException se) { throw new GrammarDocException("problem parsing source files: " + se.getMessage(), se); } catch(IOException io) { throw new GrammarDocException("io problem with source files: " + io.getMessage(), io); } return sourceGrammar; } SourceGrammarFile loadGrammarFile(SourceGrammarFileType fileType, File file) throws GrammarDocException { if(!file.exists()) { throw new GrammarDocException("file " + file.getName() + " does not exist in " + srcDir); } else if(file.isDirectory()) { throw new GrammarDocException(file.getName() + " refers to a directory in " + srcDir); } else { log("Loading " + file.getName()); try { return new SourceGrammarFile(fileType, file); } catch(Exception e) { throw new GrammarDocException("problem parsing " + file + ": " + e.getMessage(), e); } } } /** * For conformance with {@link DocumenterContext}. */ public File getDestinationDirectory() { return getDestDir(); } /** * @return Returns the destDir. */ public File getDestDir() { return destDir; } /** * @param destDir The destDir to set. */ public void setDestDir(File destDir) { this.destDir = destDir.getAbsoluteFile(); } /** * @return Returns the sourceDirectory. */ public File getSrcDir() { return srcDir; } /** * @param srcDir The sourceDirectory to set. */ public void setSrcDir(File srcDir) { this.srcDir = srcDir.getAbsoluteFile(); } public static void main(String[] args) { List arguments = Arrays.asList(args); PrintStream out = System.out; GrammarDoc gd = new CommandGrammarDoc(out); if(arguments.contains("-h") || arguments.contains("--help")) { out.println("usage: ccg-grammardoc [-s|--source sourceDir] " + "[-d|--dest destDir]"); } else { Iterator i = arguments.iterator(); try { while(i.hasNext()) { String s = i.next(); if(s.equals("-s") || s.equals("--source")) { if(gd.srcDir != null) { throw new IllegalArgumentException( "source directory already specified"); } if(!i.hasNext()) { throw new IllegalArgumentException( "encountered flag " + s + ", but no directory specified"); } gd.setSrcDir(new File(i.next())); } else if(s.equals("-d") || s.equals("--dest")) { if(gd.destDir != null) { throw new IllegalArgumentException( "destination directory already specified"); } if(!i.hasNext()) { throw new IllegalArgumentException( "encountered flag " + s + ", but no directory specified"); } gd.setDestDir(new File(i.next())); } } gd.execute(); } catch(Exception e) { gd.log("Error: " + e.getMessage()); } } } static final class CommandGrammarDoc extends GrammarDoc { PrintStream out; static final String logPrefix = "[grammardoc] "; CommandGrammarDoc(PrintStream out) { this.out = out; setProject(new Project()); setOwningTarget(new Target()); } @Override public void log(String s) { out.print(logPrefix); out.println(s); } } } ================================================ FILE: src/opennlp/ccg/grammardoc/GrammarDocException.java ================================================ /* * $Id: GrammarDocException.java,v 1.2 2006/11/01 02:53:20 coffeeblack Exp $ */ package opennlp.ccg.grammardoc; /** * An exception that occurs during the execution of {@link GrammarDoc}. * * @author Scott Martin (http://www.ling.osu.edu/~scott/) * @version $Revision: 1.2 $ */ public class GrammarDocException extends Exception { private static final long serialVersionUID = 1L; /** * Creates a new exception. 
*/ public GrammarDocException() { super(); } /** * Creates a new exception with the specified message. */ public GrammarDocException(String message) { super(message); } /** * Creates a new exception with the specified message and underlying cause. */ public GrammarDocException(String message, Throwable cause) { super(message, cause); } /** * Creates a new exception with the specified underlying cause. */ public GrammarDocException(Throwable cause) { super(cause); } } ================================================ FILE: src/opennlp/ccg/grammardoc/SourceGrammar.java ================================================ /* * $Id: SourceGrammar.java,v 1.4 2007/03/19 17:45:35 coffeeblack Exp $ */ package opennlp.ccg.grammardoc; import java.io.File; import java.util.EnumMap; import java.util.Map; import java.util.Set; /** * Represents an OpenCCG grammar that is specified in a series of XML files. * * @author Scott Martin (http://www.ling.osu.edu/~scott/) * @version $Revision: 1.4 $ */ public class SourceGrammar { File sourceDirectory; Map sourceFiles; SourceGrammar(File sourceDirectory) { this.sourceDirectory = sourceDirectory; sourceFiles = new EnumMap (SourceGrammarFileType.class); } /** * @return Returns the sourceDirectory. */ public File getSourceDirectory() { return sourceDirectory; } /** * Gets the {@link SourceGrammarFileType file names} found in this source * grammar. */ public Set getSourceGrammarFileTypes() { return sourceFiles.keySet(); } /** * Gets a source grammar file based on a specified * {@link SourceGrammarFileType file name}. * * @param fileType The file name identifying the desired * {@link SourceGrammarFile source grammar file}. */ public SourceGrammarFile getSourceGrammarFile( SourceGrammarFileType fileType) { return sourceFiles.get(fileType); } void addSourceGrammarFile(SourceGrammarFileType fileType, SourceGrammarFile sourceGrammarFile) { sourceFiles.put(fileType, sourceGrammarFile); } } ================================================ FILE: src/opennlp/ccg/grammardoc/SourceGrammarFile.java ================================================ /* * $Id: SourceGrammarFile.java,v 1.4 2007/05/30 22:53:17 coffeeblack Exp $ */ package opennlp.ccg.grammardoc; import java.io.File; import org.w3c.dom.Document; /** * A file found in a source grammar. This class encapsulates the predefined * {@link SourceGrammarFileType file name} and {@link Document DOM document}. * * @author Scott Martin (http://www.ling.osu.edu/~scott/) * @version $Revision: 1.4 $ */ public class SourceGrammarFile { SourceGrammarFileType fileType; File sourceFile; /** * Creates a new source grammar file. */ SourceGrammarFile(SourceGrammarFileType fileName, File sourceFile) { this.fileType = fileName; this.sourceFile = sourceFile; } /** * @return Returns the fileType. */ public SourceGrammarFileType getFileType() { return fileType; } /** * @return Returns the source file. */ public File getSourceFile() { return sourceFile; } /** * Gets a string version of this source grammar file. * * @return The value of this grammar file's * {@link SourceGrammarFileType#toString() file type}. */ @Override public String toString() { return fileType.toString(); } } ================================================ FILE: src/opennlp/ccg/grammardoc/SourceGrammarFileType.java ================================================ /* * $Id: SourceGrammarFileType.java,v 1.3 2007/05/02 21:51:35 coffeeblack Exp $ */ package opennlp.ccg.grammardoc; /** * File types for source grammars. 
* * @author Scott Martin (http://www.ling.osu.edu/~scott/) * @version $Revision: 1.3 $ */ public enum SourceGrammarFileType { GRAMMAR("grammar"), LEXICON("lexicon"), MORPHOLOGY("morph"), RULES("rules"), TYPES("types", false), DOCUMENTATION("documentation", false); final String fileName; final boolean required; private SourceGrammarFileType(String fileName) { this(fileName, true); } private SourceGrammarFileType(String fileName, boolean required) { this.fileName = fileName; this.required = required; } /** * Gets the file name associated with this file type. */ public String getFileName() { return fileName; } /** * Tests whether or not this grammar file name is required. * @return true iff this grammar file type is required to be present in a * grammar. */ public boolean isRequired() { return required; } } ================================================ FILE: src/opennlp/ccg/grammardoc/html/HTMLDocumenter.java ================================================ /* * $Id: HTMLDocumenter.java,v 1.9 2009/12/21 04:18:31 mwhite14850 Exp $ */ package opennlp.ccg.grammardoc.html; import java.io.BufferedOutputStream; import java.io.File; import java.io.FileOutputStream; import java.io.IOException; import java.io.InputStream; import java.util.HashMap; import java.util.Map; import javax.xml.transform.Source; import javax.xml.transform.Templates; import javax.xml.transform.Transformer; import javax.xml.transform.TransformerConfigurationException; import javax.xml.transform.TransformerException; import javax.xml.transform.TransformerFactory; import javax.xml.transform.URIResolver; import javax.xml.transform.stream.StreamResult; import javax.xml.transform.stream.StreamSource; import opennlp.ccg.grammardoc.AbstractDocumenter; import opennlp.ccg.grammardoc.DocumenterException; import opennlp.ccg.grammardoc.DocumenterSourceException; import opennlp.ccg.grammardoc.SourceGrammar; import opennlp.ccg.grammardoc.SourceGrammarFile; import opennlp.ccg.grammardoc.SourceGrammarFileType; /** * A grammardoc documenter that produces HTML documentation. * * @author Scott Martin (http://www.ling.osu.edu/~scott/) * @version $Revision: 1.9 $ */ public class HTMLDocumenter extends AbstractDocumenter implements URIResolver { private static final int FILE_BUFFER_SIZE = 256; private SourceGrammar sourceGrammar; private Map templateCache; final TransformerFactory factory = TransformerFactory.newInstance(); static enum FileName { STYLESHEET("grammardoc.css"), LEXICON_SCRIPT("lexicon.js"); final String name; private FileName(String name) { this.name = name; } } /** * Creates a new HTML Documenter. */ public HTMLDocumenter() { super("GrammarDoc HTML Documenter"); templateCache = new HashMap(); factory.setURIResolver(this); } /** * Documents a source grammar, producing linked HTML files for its source * files. */ public void document(SourceGrammar grammar) throws DocumenterException { this.sourceGrammar = grammar; File destDir = documenterContext.getDestinationDirectory(); copyFiles(destDir); String sections; StringBuilder sb = new StringBuilder(); for(SourceGrammarFileType fileType : grammar.getSourceGrammarFileTypes()) { if(sb.length() > 0) { sb.append('|'); } sb.append(fileType.getFileName()); } sections = sb.toString(); for(SourceGrammarFileType fileType : grammar .getSourceGrammarFileTypes()) { String baseName = fileType.getFileName(); StringBuilder fb = new StringBuilder(); fb.append(baseName.equals( SourceGrammarFileType.GRAMMAR.getFileName()) ? 
"index" : baseName); fb.append(".html"); String targetName = fb.toString(); SourceGrammarFile sourceFile = grammar.getSourceGrammarFile(fileType); Templates templates = loadTemplates(baseName); if(templates != null) { documenterContext.log("Generating " + targetName); try { File f = new File(destDir, targetName); StreamResult res = new StreamResult( new BufferedOutputStream(new FileOutputStream(f))); res.setSystemId(f); Transformer transformer = templates.newTransformer(); transformer.setURIResolver(this); transformer.setParameter("sections", sections); transformer.transform( new StreamSource(sourceFile.getSourceFile()), res); } catch(TransformerException te) { throw new DocumenterSourceException( "problem transforming output: " + te.getMessageAndLocation(), te, sourceFile); } catch(IOException ioe) { throw new DocumenterException(ioe); } } } } /** * Resolves URIs to sources. Used by the XSLT files in this package to * resolve xsl:import and document() URIs. */ public Source resolve(String href, String base) throws TransformerException { StreamSource ss = null; if(href != null && href.length() > 0) { if(href.endsWith(".xsl")) { ss = new StreamSource(getResource(href)); } else { File f = new File(sourceGrammar.getSourceDirectory(), href); if(!f.exists()) { throw new TransformerException("file does not exist: " + f); } if(f.isDirectory()) { throw new TransformerException("file is a directory: " + f); } ss = new StreamSource(f); ss.setSystemId(f); } } return ss; } private Templates loadTemplates(String baseName) throws DocumenterException { StringBuilder tb = new StringBuilder(baseName); tb.append(".xsl"); String templateName = tb.toString(); if(!templateCache.containsKey(templateName)) { InputStream is = getResource(templateName.toString()); if(is == null) { return null; } try { // cache for later templateCache.put(templateName, factory.newTemplates(new StreamSource(is))); } catch(TransformerConfigurationException tce) { throw new DocumenterException("problem loading template " + templateName.toString() + ": " + tce.getMessageAndLocation(), tce); } } return templateCache.get(templateName); } private void copyFiles(File destDir) throws DocumenterException { for(FileName fileName : FileName.values()) { doCopyFile(fileName, destDir); } } private void doCopyFile(FileName fileName, File destDir) throws DocumenterException { InputStream in = getResource(fileName.name); if(in == null) { throw new DocumenterException("Could not find " + fileName.name); } File f = new File(destDir, fileName.name); documenterContext.log("Writing " + f.getAbsolutePath()); try { FileOutputStream fileOut = new FileOutputStream(f); byte[] buffer = new byte[HTMLDocumenter.FILE_BUFFER_SIZE]; int i; while((i = in.read(buffer)) != -1) { fileOut.write(buffer, 0, i); } in.close(); fileOut.close(); } catch(IOException ioe) { throw new DocumenterException("problem copying file: " + ioe.getMessage(), ioe); } } private InputStream getResource(String resourceName) { Class cl = getClass(); String cn = cl.getName(); String pkg = cn.substring(0, cn.lastIndexOf('.')); StringBuilder sb = new StringBuilder(); sb.append(pkg.replace('.', '/')); sb.append('/'); sb.append(resourceName); return cl.getClassLoader().getResourceAsStream(sb.toString()); } } ================================================ FILE: src/opennlp/ccg/grammardoc/html/base.xsl ================================================ grammar lexicon morph types rules <xsl:text>Documentation for CCG grammar </xsl:text> <xsl:value-of select="$grammar-name"/> <xsl:if 
test="not($page-name='grammar')"> <xsl:text> : </xsl:text> <xsl:call-template name="capitalize"> <xsl:with-param name="word" select="$page-name"/> </xsl:call-template> </xsl:if> Generated documentation for the CCG grammar

================================================ FILE: src/opennlp/ccg/grammardoc/html/categories.xsl ================================================
[categories.xsl: XSLT markup not preserved in this extract; the surviving text nodes are the punctuation used to render categories and the slash-mode labels ("slash", "redundant", "application only", "associative", "permutative", "permutative right", "permutative left", "associative permutative right", "associative permutative left", "all rules").]
================================================ FILE: src/opennlp/ccg/grammardoc/html/comments.xsl ================================================
================================================ FILE: src/opennlp/ccg/grammardoc/html/grammar.xsl ================================================ ================================================ FILE: src/opennlp/ccg/grammardoc/html/grammardoc.css ================================================ /* * $Id: grammardoc.css,v 1.8 2007/04/18 22:54:13 coffeeblack Exp $ * Author: Scott Martin (http://www.ling.osu.edu/~scott/) */ body { margin: 0 0 2em 0; padding: 0; background-color: rgb(250,250,250); color: rgb(25,25,25); font-family: Verdana, Arial, Helvetica, sans-serif; font-size: small; } a:hover { text-decoration: none; } acronym { border-bottom: 1px dotted; cursor: help; } div.back { text-align: right; } div#container { margin: 0 20px; clear: left; } h1, h2, h3, h4, h5 { font-family: Trebuchet MS, Arial, Helvetica, sans-serif; } h1 { margin: 0 0 1em 0; border-bottom: 1px dotted rgb(150,150,150); padding: 2em 0 .5em 20px; background-color: rgb(153,0,0); color: rgb(250,250,250); font-size: 1.8em; } h2 { margin: 2em 0 1em 0; border-bottom: 1px dotted rgb(160,160,160); padding-bottom: .25em; color: rgb(153,0,0); font-size: 1.6em; } h3 { color: rgb(80,0,0); font-size: 1.4em; } h4 { font-size: 1.2em; } h5 { font-size: 1.1em; } ul { padding-left: 40px; } dl.box { border: 1px solid rgb(150,150,150); background-color: rgb(235,235,235); padding: 10px; } dl.box dt { color: rgb(153,51,0); font-family: Trebuchet MS, Arial, Helvetica, sans-serif; font-size: 1.1em; font-weight: bold; } dl.box dd, dl.attributes dd { margin-left: 0; } dl.box dd li, ul.members li { color: rgb(153,51,0); } ol.categories li { /*font-size: 1.2em;*/ } dl.category dt { font-size: 1.1em; } dl.category, dl.category dt, dl.category dd, dl.category dd dl { display: inline; } dl.attributes dt { float: left; margin-right: .25em; color: rgb(153,51,0); font-weight: bold; } dl.attributes dd { color: rgb(153,85,50); } dl.category dt { color: rgb(80,0,0); } dl.feature-structure { font-size: .85em; } dl.category dd, dl.feature-structure dt, span.ruleLabel { color: rgb(153,85,50); font-family: Georgia, "Times New Roman", serif; } dl.feature-structure dt { font-family: Verdana, Arial, Helvetica, sans-serif; font-weight: normal; } dl.feature-structure dt, dl.feature-structure dd { display: none; } span.enclosure, span.divider { font-size: 1.1em; font-weight: bold; } dl.feature-structure dd span.enclosure { font-style: normal; } ol.categories li a { margin-right: 10px; /*font-size: .85em;*/ text-decoration: none; } .expanded dl.feature-structure dt, .expanded dl.feature-structure dd { display: inline; } dl.category dd, span.ruleLabel { vertical-align: sub; } dl.category dd.category-container { vertical-align: baseline; } dd.category-container dl.category { /*font-size: 1.1em;*/ } dl.category dd.feat { font-style: italic; } dt.slash span.mode { /*font-size: .7em;*/ } dl.category dt.redundant { display: none; } dl.lf { display: inline; } dl.lf dd.nomvar, dl.lf span.prop { font-weight: normal; } dl.lf dd.nomvar { font-style: italic; } dl.category span.prop { font-weight: bold; } dl.lf span.diamond, dl.lf span.prop { color: rgb(153,85,50); } dl.entries dl dt { margin-top: 1em; } dl.entries dl dd { margin-left: 20px; } ul.rules { padding-left: 20px; list-style-type: none; } ul.rules li { padding-top: .5em; } ul#navigation { margin-left: 20px; padding-bottom: 2em; padding-left: 0; list-style-type: none; } ul#navigation li a { float: left; margin-right: 10px; border: 1px solid rgb(150,150,150); background-color: rgb(235,235,235); color: 
rgb(153,0,0); padding: 5px; text-decoration: none; font-weight: bold; } ul#navigation li a.current, ul#navigation li a:hover, ul#navigation li a:active { background-color: rgb(153,0,0); border: 1px dotted rgb(150,150,150); color: rgb(255,255,255); } a.unaryRuleExpander { float: left; margin-right: 5px; text-decoration: none; } dd.unaryResult { display: inline; } dl.unaryRule { /*font-size: 1.1em !important;*/ color: rgb(153,51,0); } dl.unaryRule span.arrow { color: rgb(153,85,50); font-weight: bold; } ul.short { list-style-type: none; } ul.short li { display: inline; } dl.shortcuts ul.short li { color: rgb(25,25,25); } ul.short li + li:before { content: ","; } ================================================ FILE: src/opennlp/ccg/grammardoc/html/lexicon.js ================================================ /* * $Id: lexicon.js,v 1.2 2006/12/13 19:25:22 coffeeblack Exp $ * Author: Scott Martin (http://www.ling.osu.edu/~scott/) */ function toggleFeatures(elem) { elem.className = (elem.className == "expanded") ? "" : "expanded"; var anchors = elem.getElementsByTagName("a"); anchors[0].innerHTML = (elem.className == "expanded") ? "[-]" : "[+]"; anchors[0].setAttribute("title", ((elem.className == "expanded") ? "collapse" : "expand") + " feature structures"); } ================================================ FILE: src/opennlp/ccg/grammardoc/html/lexicon.xsl ================================================
Lexical Families
Closed: false
Part of Speech:
Lexical Items
Members
Categories
================================================ FILE: src/opennlp/ccg/grammardoc/html/morph.xsl ================================================
Entries
Macros
Member of:
Feature Structures
Logical Form
================================================ FILE: src/opennlp/ccg/grammardoc/html/navigation.xsl ================================================
grammar|lexicon|morph|rules|types
current index .html
================================================ FILE: src/opennlp/ccg/grammardoc/html/rules.xsl ================================================
List of Rules
Application Rules
Composition Rules
Substitution Rules
Typeraising Rules
Typechanging
================================================ FILE: src/opennlp/ccg/grammardoc/html/types.xsl ================================================
Type Hierarchy
  • ================================================ FILE: src/opennlp/ccg/hylo/Alt.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-6 Michael White (University of Edinburgh, The Ohio State University) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import java.io.Serializable; import java.util.BitSet; /** * Class for representing alts. * LF alts are used during realization to represent * exclusive disjunctions in the input. * The alts are represented as pairs of ints, * one for the alt set and one for the alt within the set. * The alts are numbered starting with 0. * An alt has a bitset for the elementary predications * within the alt. * * @author Michael White * @version $Revision: 1.6 $, $Date: 2009/07/17 04:23:30 $ */ public final class Alt implements Comparable, Serializable { private static final long serialVersionUID = 7241395629445814238L; /** The alt set number. */ public final int altSet; /** The alt within the set. */ public final int numInSet; /** The bitset. */ public final BitSet bitset = new BitSet(); /** Constructor. */ public Alt(int altSet, int numInSet) { this.altSet = altSet; this.numInSet = numInSet; } /** Equals. */ public boolean equals(Object o) { if (!(o instanceof Alt)) return false; Alt a = (Alt) o; return altSet == a.altSet && numInSet == a.numInSet; } /** Comparison. */ public int compareTo(Alt a) { if (altSet < a.altSet) return -1; if (altSet == a.altSet && numInSet < a.numInSet) return -1; if (altSet == a.altSet && numInSet == a.numInSet) return 0; return 1; } } ================================================ FILE: src/opennlp/ccg/hylo/Box.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002 Jason Baldridge // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import opennlp.ccg.synsem.*; import opennlp.ccg.unify.*; import org.jdom.*; /** * A modal box operator, such as [F]q. * * @author Jason Baldridge * @version $Revision: 1.5 $, $Date: 2009/07/17 04:23:30 $ **/ public final class Box extends ModalOp { private static final long serialVersionUID = 1575311851235814524L; public Box(Element e) { super(e); } private Box(Mode mode, LF arg) { super(mode, arg); } public LF copy() { return new Box ((Mode)_mode.copy(), _arg.copy()); } public boolean equals(Object o) { if (o instanceof Box) { return super.equals((Box)o); } else { return false; } } public void unifyCheck(Object u) throws UnifyFailure { if (u instanceof Box) { super.unifyCheck((Box)u); } else { throw new UnifyFailure(); } } public Object fill(Substitution sub) throws UnifyFailure { return new Box((Mode)_mode.fill(sub), (LF)_arg.fill(sub)); } /** Returns the string form of this modal op, without the arg. */ public String modalOpString() { return new StringBuffer().append('[').append(_mode.toString()).append(']').toString(); } /** * Returns an XML representation of this LF (not currently supported). * Throws a runtime exception. */ public Element toXml() { throw new RuntimeException("toXml() not currently supported for Box."); } } ================================================ FILE: src/opennlp/ccg/hylo/Compacter.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-6 Michael White (University of Edinburgh, The Ohio State University) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import opennlp.ccg.synsem.*; import opennlp.ccg.util.*; import java.util.*; /** * A class implementing compaction of flattened LFs. * * @author Michael White * @version $Revision: 1.1 $, $Date: 2006/09/04 14:09:10 $ **/ public class Compacter { /** * Returns a compacted LF from the given flattened one. * A root nominal may also be given (otherwise null). * Nominals with multiple parents are kept separate. * If there are any duplicate predications, an attempt * is made to attach them in different locations. 
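* For example, flattened preds such as @x1(want), @x1(<Arg1>x2) and @x2(book) are recombined into the single term @x1(want ^ <Arg1>(x2 ^ book)).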
*/ static LF compact(LF lf, Nominal root) { // get preds, make copies List preds = HyloHelper.getPreds(lf); for (int i=0; i < preds.size(); i++) { SatOp pred = preds.get(i); preds.set(i, (SatOp) pred.copy()); } // check for single pred if (preds.size() == 1) return preds.get(0); // find unique parents and multiple parents Map parents = new HashMap(); GroupMap multipleParents = new GroupMap(); for (int i = 0; i < preds.size(); i++) { SatOp pred = preds.get(i); // get principal nominal as nom1 Nominal nom1 = HyloHelper.getPrincipalNominal(pred); // get secondary nominal Nominal nom2 = HyloHelper.getSecondaryNominal(pred); // skip if none or nom2 equal to root if (nom2 == null) continue; if (root != null && nom2.equals(root)) continue; // if nom2 already in group map, add nom1 as another parent if (multipleParents.containsKey(nom2)) { multipleParents.put(nom2, nom1); } // if nom2 already in parent map, add existing parent and nom1 to group map, // record pred, then remove nom2 from parent map else if (parents.containsKey(nom2)) { multipleParents.put(nom2, parents.get(nom2)); multipleParents.put(nom2, nom1); parents.remove(nom2); } // otherwise put in nom1 as parent else { parents.put(nom2, nom1); } } // check multiple parent nominals for cycles int prevSize = -1; List history = new ArrayList(); while (multipleParents.size() != prevSize) { prevSize = multipleParents.size(); for (Iterator it = multipleParents.keySet().iterator(); it.hasNext(); ) { Nominal nom = it.next(); Set nomParents = multipleParents.get(nom); for (Iterator it2 = nomParents.iterator(); it2.hasNext(); ) { Nominal parent = it2.next(); history.clear(); history.add(nom); while (parent != null && !history.contains(parent)) { history.add(parent); parent = parents.get(parent); } // remove if cycle found if (parent != null) it2.remove(); } // switch to single parent if others removed if (nomParents.size() == 1) { Nominal parent = nomParents.iterator().next(); parents.put(nom, parent); it.remove(); } } } // break any remaining cycles in parent relationships for (Iterator it = parents.keySet().iterator(); it.hasNext(); ) { Nominal nom = it.next(); Nominal parent = parents.get(nom); history.clear(); history.add(nom); while (parent != null && !history.contains(parent)) { history.add(parent); parent = parents.get(parent); } if (parent != null) { it.remove(); } } // ensure sorted HyloHelper.sort(preds); // combine preds on same nominal // also: gather any duplicate preds List combinedPreds = new ArrayList(preds.size()); List dupPreds = new ArrayList(preds.size()); SatOp currentSatOp = preds.get(0); Nominal currentNominal = currentSatOp.getNominal(); combinedPreds.add(currentSatOp); for (int i = 1; i < preds.size(); i++) { SatOp satOp = preds.get(i); // skip if equal to previous, saving in dupPreds if (satOp.equals(preds.get(i-1))) { dupPreds.add(satOp); continue; } // check for different nominal Nominal nominal = satOp.getNominal(); if (!nominal.equals(currentNominal)) { // add to combined preds, update current refs currentSatOp = satOp; currentNominal = nominal; combinedPreds.add(currentSatOp); } // otherwise combine else { combine(currentSatOp, satOp); } } // compact preds with unique parent for (int i = 0; i < combinedPreds.size(); i++) { SatOp satOp1 = combinedPreds.get(i); Nominal nom1 = satOp1.getNominal(); if (!parents.containsValue(nom1)) continue; for (int j = 0; j < combinedPreds.size(); j++) { SatOp satOp2 = combinedPreds.get(j); Nominal nom2 = satOp2.getNominal(); if (nom1.equals(nom2)) continue; if 
(!parents.containsKey(nom2)) continue; if (nom1.equals(parents.get(nom2))) { subst(satOp1, satOp2, nom2, null); } } } // get root nominals, root preds, and multiple parent preds List roots = new ArrayList(); List rootPreds = new ArrayList(); List multipleParentPreds = new ArrayList(); for (int i = 0; i < combinedPreds.size(); i++) { SatOp pred = combinedPreds.get(i); Nominal nom = pred.getNominal(); if (!parents.containsKey(nom) && !multipleParents.containsKey(nom)) { roots.add(nom); rootPreds.add(pred); } if (multipleParents.containsKey(nom)) { multipleParentPreds.add(pred); } } // compact preds with multiple parents, using parent that is closest to a root prevSize = -1; while (multipleParentPreds.size() != prevSize) { prevSize = multipleParentPreds.size(); // for each nominal with multiple parents for (Iterator it = multipleParentPreds.iterator(); it.hasNext(); ) { SatOp pred = it.next(); Nominal nom = pred.getNominal(); // find parent closest to root, but checking for a parent not below a root Set nomParents = multipleParents.get(nom); Nominal parentClosestToRoot = null; int closestDist = 0; int closestRootIndex = -1; for (Iterator it2 = nomParents.iterator(); it2.hasNext(); ) { Nominal parent = it2.next(); int dist = 0; // trace parents to top ancestor Nominal topAncestor = parent; while (parents.containsKey(topAncestor)) { topAncestor = parents.get(topAncestor); dist++; } // if top ancestor a root, update closest parent if (roots.contains(topAncestor)) { if (parentClosestToRoot == null || dist < closestDist) { parentClosestToRoot = parent; closestDist = dist; closestRootIndex = roots.indexOf(topAncestor); } } // otherwise set closest dist to -1, to indicate that not all ancestors are roots else { closestDist = -1; } } // check for a parent not below a root, or no closest root, and skip this nom if so if (closestDist == -1 || closestRootIndex == -1) { continue; } // otherwise compact under root pred of parent closest to root SatOp closestRootPred = rootPreds.get(closestRootIndex); subst(closestRootPred, pred, nom, parentClosestToRoot); // update parents map parents.put(nom, parentClosestToRoot); // and remove from iterator it.remove(); } } // set retval to single remaining pred or conjunction of remaining ones LF retval; List retPreds = new ArrayList(); retPreds.addAll(rootPreds); retPreds.addAll(multipleParentPreds); if (retPreds.size() == 1) { retval = retPreds.get(0); } else { retval = new Op(Op.CONJ, retPreds); } // tmp for (SatOp dup : dupPreds) { Nominal nom = dup.getNominal(); Nominal dupParent = findDupParent(retval, dup, nom); subst(retval, dup, nom, dupParent); } // return return retval; } // combines two preds for the same nominal into the first pred, // where either both preds are elementary, // or the first is the result of an earlier combination private static void combine(SatOp satOp1, SatOp satOp2) { // get args LF arg1 = satOp1.getArg(); LF arg2 = satOp2.getArg(); // check if arg1 already conj op if (arg1 instanceof Op && ((Op)arg1).getName().equals(Op.CONJ)) { List args = ((Op)arg1).getArguments(); args.add(arg2); } // or make it one else { List args = new ArrayList(2); args.add(arg1); args.add(arg2); satOp1.setArg(new Op(Op.CONJ, args)); } } // substitutes the second satop into the first lf at nom2, optionally // respecting the given parent constraint (if non-null) // returns whether the substitution has been made private static boolean subst(LF lf, SatOp satOp2, Nominal nom2, Nominal requiredParent) { return subst(lf, null, satOp2, nom2, requiredParent); } // 
recursive implementation that tracks the current parent and // returns whether the substitution has been made private static boolean subst(LF lf, Nominal currentParent, SatOp satOp2, Nominal nom2, Nominal requiredParent) { // recurse to nom2, then append if requiredParent constraint met if (lf instanceof SatOp) { SatOp satOp = (SatOp) lf; return subst(satOp.getArg(), satOp.getNominal(), satOp2, nom2, requiredParent); } else if (lf instanceof Diamond) { Diamond d = (Diamond) lf; LF arg = d.getArg(); // check for nom2, and that requiredParent constraint met if (arg.equals(nom2) && (requiredParent == null || requiredParent.equals(currentParent))) { // make substitution d.setArg(HyloHelper.append(arg, satOp2.getArg())); return true; } else { return subst(arg, currentParent, satOp2, nom2, requiredParent); } } else if (lf instanceof Op) { Op op = (Op) lf; List args = op.getArguments(); for (int i = 0; i < args.size(); i++) { LF arg = args.get(i); if (arg instanceof Nominal) { // check for nom2, and that requiredParent constraint met if (arg.equals(nom2) && (requiredParent == null || requiredParent.equals(currentParent))) { // make substitution // nb: this (rarely used) operation doesn't nec. preserve the sort order, unfortunately op.appendArgs(satOp2.getArg()); return true; } // otherwise, set current parent and continue else { currentParent = (Nominal) arg; continue; } } boolean madeSubst = subst(arg, currentParent, satOp2, nom2, requiredParent); if (madeSubst) return true; } } return false; } // returns a parent nominal where the duplicate pred can be substituted // if there is no equivalent pred there already; otherwise returns null private static Nominal findDupParent(LF lf, SatOp dup, Nominal dupNom) { return findDupParent(lf, null, dup, dupNom); } // recursive implementation that tracks the current parent private static Nominal findDupParent(LF lf, Nominal currentParent, SatOp dup, Nominal dupNom) { // recurse to dupNom, then return parent if apropos if (lf instanceof SatOp) { SatOp satOp = (SatOp) lf; return findDupParent(satOp.getArg(), satOp.getNominal(), dup, dupNom); } else if (lf instanceof Diamond) { Diamond d = (Diamond) lf; LF arg = d.getArg(); // check for dupNom by itself, and return parent if (arg.equals(dupNom)) return currentParent; else return findDupParent(arg, currentParent, dup, dupNom); } else if (lf instanceof Op) { Op op = (Op) lf; List args = op.getArguments(); for (int i = 0; i < args.size(); i++) { LF arg = args.get(i); if (arg instanceof Nominal) { // check for dupNom, and that no equiv pred constraint met if (arg.equals(dupNom) && !args.contains(dup.getArg())) // return parent return currentParent; // otherwise, set current parent and continue else { currentParent = (Nominal) arg; continue; } } Nominal retval = findDupParent(arg, currentParent, dup, dupNom); if (retval != null) return retval; } } return null; } } ================================================ FILE: src/opennlp/ccg/hylo/Converter.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-9 Michael White (University of Edinburgh, The Ohio State University) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. 
// // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import opennlp.ccg.TextCCG; import opennlp.ccg.synsem.*; import java.util.*; import java.util.prefs.Preferences; /** * A class implementing conversion of nominal variables to nominal atoms. * * @author Michael White * @version $Revision: 1.7 $, $Date: 2010/08/31 16:20:43 $ **/ public class Converter { /** Preference key for using word positions to name atoms. */ public static final String USE_WORD_POSITIONS_FOR_ATOM_CONVERSION = "Use Word Positions To Convert Atoms"; // map to already converted nominals private Map nominalMap = new HashMap(); // map to int for names private Map nameMap = new HashMap(); // flag for whether to skip absent props private boolean skipAbsentProp = true; /** Converts nominal vars to atoms, renaming them based on lexical propositions. */ static void convertNominals(LF lf) { convertNominals(lf, null, null); } /** * Converts nominal vars to atoms, renaming them based on word position, if * a root sign is given, otherwise using lexical propositions; * returns the converted nominal root. */ static Nominal convertNominals(LF lf, Sign root, Nominal nominalRoot) { // check preference for naming with word positions; set root to null if false Preferences prefs = Preferences.userNodeForPackage(TextCCG.class); boolean useWordPositions = prefs.getBoolean(USE_WORD_POSITIONS_FOR_ATOM_CONVERSION, true); if (!useWordPositions) root = null; // traverse twice, skipping absent props the first time Converter converter = new Converter(); converter.convertNoms(lf, root); converter.skipAbsentProp = false; converter.convertNoms(lf, root); // return converted nominal root, if any Nominal retval = null; if (nominalRoot != null) { retval = converter.nominalMap.get(nominalRoot); } return retval; } // recurse through lf, converting nominals private void convertNoms(LF lf, Sign root) { if (lf instanceof SatOp) { SatOp satOp = (SatOp) lf; // try finding word index of lex origin in root sign int wordIndex = -1; if (root != null) { LexSemOrigin origin = satOp.getOrigin(); if (origin instanceof Sign) { Sign lexSign = (Sign) origin; // make sure it's not dominated by another lex pred // nb: also need to check for special pred 'elem', which isn't // dominated in sample flights grammar String lexPred = HyloHelper.getLexPred(satOp); if (lexPred != null && !lexPred.equals("elem")) { if (!lexDominated(lexPred, lexSign)) wordIndex = root.wordIndex(lexSign); } } } Nominal oldNom = satOp.getNominal(); Proposition prop = null; LF arg = satOp.getArg(); if (arg instanceof Proposition) { prop = (Proposition) arg; } else if (arg instanceof Op) { Op op = (Op) arg; LF first = (LF) op.getArguments().get(0); if (first instanceof Proposition) { prop = (Proposition) first; } } Nominal convertedNom = convertNominal(oldNom, prop, wordIndex); satOp.setNominal(convertedNom); convertNoms(arg, root); } else if (lf instanceof Diamond) { Diamond d = (Diamond) lf; LF arg = d.getArg(); if (arg instanceof Nominal) { Nominal oldNom = (Nominal) arg; Nominal 
convertedNom = convertNominal(oldNom, null, -1); d.setArg(convertedNom); } else if (arg instanceof Op) { Op op = (Op) arg; List args = op.getArguments(); LF first = args.get(0); if (first instanceof Nominal) { Nominal oldNom = (Nominal) first; LF second = args.get(1); Proposition prop = null; if (second instanceof Proposition) { prop = (Proposition) second; } Nominal convertedNom = convertNominal(oldNom, prop, -1); args.set(0, convertedNom); } convertNoms(arg, root); } } else if (lf instanceof Op) { List args = ((Op)lf).getArguments(); for (int i = 0; i < args.size(); i++) { convertNoms(args.get(i), root); } } } // returns a nominal atom based on the old nominal, prop and maps, // which are updated accordingly; // wordIndex is used instead if non-negative; // the skipAbsentProp flag controls whether to skip a null prop, // so that a meaningful name might be created later private Nominal convertNominal(Nominal oldNom, Proposition prop, int wordIndex) { // check for an atom if (oldNom instanceof NominalAtom) return oldNom; // handle word index case if (wordIndex >= 0) return convertNominal(oldNom, "w" + wordIndex); // skip absent props according to flag if (prop == null && skipAbsentProp) return oldNom; // check if already converted, and return copy Nominal alreadyConvertedNom = nominalMap.get(oldNom); if (alreadyConvertedNom != null) { return (Nominal) alreadyConvertedNom.copy(); } // otherwise create new atom, with name based on prop (if possible) String nameBase = "x"; if (prop != null) { nameBase = prop.toString().toLowerCase().substring(0,1); // use "n" if not a letter if (!Character.isLetter(nameBase.charAt(0))) nameBase = "n"; } int ext = 1; Integer baseCount = nameMap.get(nameBase); if (baseCount != null) { ext = baseCount.intValue() + 1; } nameMap.put(nameBase, new Integer(ext)); String name = nameBase + ext; return convertNominal(oldNom, name); } // returns the converted nominal using the given name, updating the map private Nominal convertNominal(Nominal oldNom, String name) { Nominal retval = new NominalAtom(name, oldNom.getType()); nominalMap.put(oldNom, retval); return retval; } //--------------------------------------------------------------------------- // check for dominating lex pred // // returns true if the EP for the lexPred is dominated by another lex pred private static boolean lexDominated(String lexPred, Sign lexSign) { Category cat = lexSign.getCategory(); LF lf = cat.getLF(); Nominal index = cat.getIndexNominal(); List preds = HyloHelper.getPreds(lf); // find EP with lexPred, other lex preds SatOp lexEP = null; List otherLexPreds = new ArrayList(); for (SatOp pred : preds) { if (HyloHelper.isLexPred(pred)) { if (lexPred.equals(HyloHelper.getLexPred(pred))) lexEP = pred; else otherLexPreds.add(pred); } } if (lexEP == null) { throw new RuntimeException("Couldn't find lexPred: " + lexPred); } // check domination Nominal lexNom = HyloHelper.getPrincipalNominal(lexEP); for (SatOp pred : otherLexPreds) { Nominal otherNom = HyloHelper.getPrincipalNominal(pred); Stack seen = new Stack(); seen.push(index); // don't recurse through index nominal if (dominates(otherNom, lexNom, preds, seen)) return true; } // otherwise false return false; } // returns true if a dominates b in preds, using seen stack to avoid looping private static boolean dominates(Nominal a, Nominal b, List preds, Stack seen) { // check for identity if (a.equals(b)) return false; // push a to seen noms seen.push(a); // check relations for (SatOp pred : preds) { if 
(a.equals(HyloHelper.getPrincipalNominal(pred))) { Nominal c = HyloHelper.getSecondaryNominal(pred); if (c == null) continue; // check immed dominance if (b.equals(c)) return true; // found dominance! // check seen if (seen.contains(c)) continue; // recurse if (dominates(c, b, preds, seen)) return true; } } // otherwise not; pop a and return seen.pop(); return false; } //--------------------------------------------------------------------------- // convert nominal atoms back to vars // /** Converts nominal atoms back to vars. */ static void convertNominalsToVars(List preds) { convertNominalsToVars(preds, null); } /** * Converts nominal atoms back to vars, returning the converted nominal root. */ static Nominal convertNominalsToVars(List preds, Nominal nominalRoot) { Nominal retval = null; for (SatOp pred : preds) { Nominal nom = pred._nominal; Nominal nv = convertNominalToVar(nom); if (nom.equals(nominalRoot)) retval = nv; pred.setNominal(nv); LF arg = pred.getArg(); if (arg instanceof Diamond) { Diamond dArg = (Diamond) arg; LF arg2 = dArg.getArg(); if (arg2 instanceof Nominal) { Nominal nv2 = convertNominalToVar((Nominal)arg2); dArg.setArg(nv2); } } } return retval; } // returns a nominal var with the same name as the given nominal static Nominal convertNominalToVar(Nominal nom) { return new NominalVar(nom.getName().toUpperCase(), nom.getType()); } } ================================================ FILE: src/opennlp/ccg/hylo/Diamond.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import opennlp.ccg.synsem.*; import opennlp.ccg.unify.*; import org.jdom.*; /** * A modal diamond operator, such as <P>p. 
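* The argument of a diamond is typically a proposition (a semantic feature value) or a nominal (the target of a dependency relation).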
* * @author Jason Baldridge * @author Michael White * @version $Revision: 1.6 $, $Date: 2009/07/17 04:23:30 $ **/ public final class Diamond extends ModalOp { private static final long serialVersionUID = 543211908001651361L; public Diamond(Element e) { super(e); } public Diamond(Mode mode, LF arg) { super(mode, arg); } public LF copy() { return new Diamond ((Mode)_mode.copy(), _arg.copy()); } public boolean equals(Object o) { if (o instanceof Diamond) { return super.equals((Diamond)o); } else { return false; } } public void unifyCheck(Object u) throws UnifyFailure { if (u instanceof Diamond) { super.unifyCheck((Diamond)u); } else { throw new UnifyFailure(); } } public Object unify(Object u, Substitution sub) throws UnifyFailure { if (u instanceof HyloFormula) { if (u instanceof Diamond) { Mode $mode = (Mode) Unifier.unify(_mode, ((Diamond)u)._mode, sub); LF $arg = (LF) Unifier.unify(_arg,((Diamond)u)._arg, sub); return new Diamond($mode, $arg); } else return super.unify(u,sub); } else { throw new UnifyFailure(); } } public Object fill(Substitution sub) throws UnifyFailure { return new Diamond((Mode)_mode.fill(sub), (LF)_arg.fill(sub)); } /** Returns the string form of this modal op, without the arg. */ public String modalOpString() { return new StringBuffer().append('<').append(_mode.toString()).append('>').toString(); } /** * Returns an XML representation of this LF. */ public Element toXml() { Element retval = new Element("diamond"); retval.setAttribute("mode", _mode.toString()); Element argElt = _arg.toXml(); retval.addContent(argElt); return retval; } } ================================================ FILE: src/opennlp/ccg/hylo/EPsScorer.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Michael White (The Ohio State University) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import opennlp.ccg.synsem.*; import opennlp.ccg.util.Pair; import java.text.NumberFormat; import java.util.*; /** * A class implementing LF scoring in terms of recall and precision * of elementary predications. * * @author Michael White * @version $Revision: 1.5 $, $Date: 2010/11/15 03:21:12 $ **/ public class EPsScorer { /** * Class for scoring results. 
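* Holds recall, precision and f-score over all elementary predications, plus the same measures restricted to labeled and to unlabeled dependencies.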
*/ public static class Results { // results public double recall = 0.0; public double precision = 0.0; public double fscore = 0.0; public double depsRecall = 0.0; public double depsPrecision = 0.0; public double depsFscore = 0.0; public double unlabeledDepsRecall = 0.0; public double unlabeledDepsPrecision = 0.0; public double unlabeledDepsFscore = 0.0; // display public String toString() { return "fscore: " + nf.format(fscore) + " recall: " + nf.format(recall) + " precision: " + nf.format(precision) + " deps fscore: " + nf.format(depsFscore) + " deps recall: " + nf.format(depsRecall) + " deps precision: " + nf.format(depsPrecision) + " unlabeled deps fscore: " + nf.format(unlabeledDepsFscore) + " unlabeled deps recall: " + nf.format(unlabeledDepsRecall) + " unlabeled deps precision: " + nf.format(unlabeledDepsPrecision); } // formats to four decimal places private static final NumberFormat nf = initNF(); private static NumberFormat initNF() { NumberFormat f = NumberFormat.getInstance(); f.setMinimumIntegerDigits(1); f.setMinimumFractionDigits(1); f.setMaximumFractionDigits(4); return f; } } /** * Returns the results of scoring an LF against a gold LF. */ public static Results score(LF lf, LF goldLF) { // get EPs List eps = HyloHelper.flatten(lf); List goldEPs = HyloHelper.flatten(goldLF); Set epsSet = new HashSet(eps); Set goldEPsSet = new HashSet(goldEPs); // get unlabeled deps Set> unlabeledDepsSet = new HashSet>(); Set> goldUnlabeledDepsSet = new HashSet>(); for (SatOp ep : eps) { Pair dep = getDep(ep); if (dep != null) unlabeledDepsSet.add(dep); } for (SatOp ep : goldEPs) { Pair dep = getDep(ep); if (dep != null) goldUnlabeledDepsSet.add(dep); } // calc recall Results retval = new Results(); int recalled = 0, depsRecalled = 0, unlabeledDepsRecalled = 0; int goldDeps = goldUnlabeledDepsSet.size(); for (SatOp ep : goldEPs) { boolean isdep = HyloHelper.isRelPred(ep); if (epsSet.contains(ep)) { recalled++; if (isdep) depsRecalled++; } if (isdep && unlabeledDepsSet.contains(getDep(ep))) unlabeledDepsRecalled++; } retval.recall = 1.0 * recalled / goldEPs.size(); retval.depsRecall = (goldDeps > 0) ? 1.0 * depsRecalled / goldDeps : 1.0; retval.unlabeledDepsRecall = (goldDeps > 0) ? 1.0 * unlabeledDepsRecalled / goldDeps : 1.0; // calc precision int precise = 0, depsPrecise = 0, unlabeledDepsPrecise = 0; int lfDeps = unlabeledDepsSet.size(); for (SatOp ep : eps) { boolean isdep = HyloHelper.isRelPred(ep); if (goldEPsSet.contains(ep)) { precise++; if (isdep) depsPrecise++; } if (isdep && goldUnlabeledDepsSet.contains(getDep(ep))) unlabeledDepsPrecise++; } retval.precision = 1.0 * precise / eps.size(); retval.depsPrecision = (lfDeps > 0) ? 1.0 * depsPrecise / lfDeps : 1.0; retval.unlabeledDepsPrecision = (lfDeps > 0) ? 
1.0 * unlabeledDepsPrecise / lfDeps : 1.0; // calc f-score retval.fscore = fscore(retval.recall, retval.precision); retval.depsFscore = fscore(retval.depsRecall, retval.depsPrecision); retval.unlabeledDepsFscore = fscore(retval.unlabeledDepsRecall, retval.unlabeledDepsPrecision); // done return retval; } // returns an unlabeled dependency as a pair of nominals, or null if the ep is not relational private static Pair getDep(SatOp ep) { if (HyloHelper.isRelPred(ep)) { // put nominals in canonical order, so that direction of dependency doesn't matter Nominal n1 = HyloHelper.getPrincipalNominal(ep); Nominal n2 = HyloHelper.getSecondaryNominal(ep); if (n1.compareTo(n2) <= 0) return new Pair(n1, n2); else return new Pair(n2, n1); } else return null; } /** Calculates f-score as balanced harmonic mean of recall and precision. */ public static double fscore(double recall, double precision) { if (recall + precision == 0.0) return 0.0; return 2.0 * recall * precision / (recall + precision); } } ================================================ FILE: src/opennlp/ccg/hylo/EnglishAgreementExtractor.java ================================================ package opennlp.ccg.hylo; /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2011 Rajakrishnan Rajkumar // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// import opennlp.ccg.lexicon.Word; import opennlp.ccg.perceptron.Alphabet; import opennlp.ccg.perceptron.FeatureExtractor; import opennlp.ccg.perceptron.FeatureMap; import opennlp.ccg.perceptron.FeatureVector; import opennlp.ccg.synsem.AtomCat; import opennlp.ccg.synsem.Category; import opennlp.ccg.synsem.ComplexCat; import opennlp.ccg.synsem.Sign; import opennlp.ccg.unify.FeatureStructure; import opennlp.ccg.unify.SimpleType; import opennlp.ccg.util.TrieMap; import opennlp.ccg.hylo.LexDependency; import java.util.*; /** * Class which extracts subject verb and relative pronoun agreement features for * English (described in): * * @InProceedings{rajkumar-white:2010:POSTERS, * author = {Rajkumar, Rajakrishnan and White, Michael}, * title = {Designing Agreement Features for Realization Ranking}, * booktitle = {Coling 2010: Posters}, * month = {August}, * year = {2010}, * address = {Beijing, China}, * publisher = {Coling 2010 Organizing Committee}, * pages = {1032--1040}, * url = {http://www.aclweb.org/anthology/C10-2119} * } * * The class extracts features based on the OpenCCG HLDS specific LF rels: ArgN (subject rel), whApposRel, GenRel, First, Next * * @author raja * @version $Revision: 1.11 $, $Date: 2011/11/25 18:18:33 $ */ public class EnglishAgreementExtractor implements FeatureExtractor{ /** Feature map wrapper, for unique retrieval from a sign's data objects. 
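* Wrapping the map in its own class gives it a unique class key, so it can be stored and fetched via the sign's addData/getData mechanism without clashing with other data objects.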
*/ public static class FeatureMapWrapper { public FeatureMap featureMap; public FeatureMapWrapper(FeatureMap featureMap) { this.featureMap = featureMap;} } /** Inner class to store specific properties of signs (right now for unbalanced punctuation status). */ private class SignProps{ //Store comma/dash unbalanced punctuation private String unbalPunct=null; /** Constructor to specify unbalanced punctuation. */ public SignProps(String unbalPunct){ this.unbalPunct=unbalPunct; } public String getUnbalancedPunct(){ return unbalPunct; } } /** The alphabet. */ protected Alphabet alphabet = null; /** Current feature map. */ protected FeatureMap currentMap = null; /** Head and dependent signs (For feature extraction) .*/ protected Sign headSign=null; protected Sign depSign=null; /** Error analysis related. */ //Sentence id String sentId=null; //Instance num int INSTANCENUM=0; /** Subject-verb agreement feature extractors. */ protected List>> agrExtractors = new ArrayList>>(); protected List>> agrConjExtractors = new ArrayList>>(); protected List>> agrOfComplementExtractors = new ArrayList>>(); /** WH-pronoun agreement feature extractors. */ protected List>> whExtractors = new ArrayList>>(); protected List>> whConjExtractors = new ArrayList>>(); /** Punctuation agreement feature extractors. */ protected List>> punctExtractor = new ArrayList>>(); /** Constructors. */ //Constructor used during actual perceptron training and testing public EnglishAgreementExtractor() { // init lazy feature extractors this.init(); } //Constructor used during error analysis using serialized signs public EnglishAgreementExtractor(String sentId) { //init lazy feature extractors this.sentId=sentId; this.INSTANCENUM=0; this.init(); } /** Sets the alphabet. */ public void setAlphabet(Alphabet alphabet) { this.alphabet = alphabet; } /** Initializes lazy feature extractors .*/ public void init() { //Agreement: Simple subj-verb feature extractors this.agrExtractors.add(dep_word_head_word(1)); this.agrExtractors.add(dep_word_head_pos(1)); this.agrExtractors.add(dep_pos_head_word(1)); this.agrExtractors.add(dep_pos_head_pos(1)); //Agreement: Disjunct subj feature extractors this.agrConjExtractors.add(dep_word_head_word(2)); this.agrConjExtractors.add(dep_word_head_pos(2)); this.agrConjExtractors.add(dep_pos_head_word(2)); this.agrConjExtractors.add(dep_pos_head_pos(2)); //Agreement: Of-complement feature extractors this.agrOfComplementExtractors.add(dep_word_head_word(3)); this.agrOfComplementExtractors.add(dep_word_head_pos(3)); this.agrOfComplementExtractors.add(dep_pos_head_word(3)); this.agrOfComplementExtractors.add(dep_pos_head_pos(3)); //WH-pronoun: Simple relative pronoun feature extractors this.whExtractors.add(dep_word_head_stem(4)); this.whExtractors.add(dep_word_head_pos(4)); this.whExtractors.add(dep_word_head_class(4)); //WH-pronoun: Conjunct/Disjunct subj feature extractors this.whConjExtractors.add(dep_word_head_stem(5)); this.whConjExtractors.add(dep_word_head_pos(5)); this.whConjExtractors.add(dep_word_head_class(5)); //Unbalanced punctuation this.punctExtractor.add(unbal_punct()); } /** Returns the features for the given sign and completeness flag. */ public FeatureVector extractFeatures(Sign sign, boolean complete) { addFeatures(sign, complete); return getFeatureMap(sign); } /** Recursively adds features to the feature map for the given sign, if not already present. 
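* Agreement features are extracted from each newly filled dependency (subject-verb, disjunct-subject, of-complement and relative-pronoun cases), and a punctuation feature fires when unbalanced sentence-medial punctuation is followed by a non-punctuation word.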
*/ //TODO: Lazier feature extraction involving conditional feature extractors protected void addFeatures(Sign sign, boolean complete) { // check for existing map, otherwise make one if (getFeatureMap(sign) != null) return; // lex case if (sign.isLexical()) { currentMap = new FeatureMap(0); } // non-terminal else { Sign[] inputs = sign.getDerivationHistory().getInputs(); // first recurse for (Sign child : inputs) addFeatures(child, false); // use input maps in making current map if (inputs.length == 1) { currentMap = new FeatureMap(getFeatureMap(inputs[0])); } else if (inputs.length == 2) { currentMap = new FeatureMap(getFeatureMap(inputs[0]), getFeatureMap(inputs[1])); } String subjArg=null; //do each newly filled dep for (LexDependency dep : sign.getFilledDeps()) { this.headSign=dep.lexHead; this.depSign=dep.lexDep; //System.out.println("DEP: "+dep); //Find value of the subject feature if(subjArg==null){ subjArg=getSubjectFeature(dep.lexHead.getCategory()); //Back-off to Arg0 heuristic if subject feature not available for this verb if(subjArg==null)subjArg="Arg0"; } //Subject-verb agr features if(subjArg.equals(dep.rel) && (dep.lexHead.getOrthography().equals("was") || dep.lexHead.getOrthography().equals("were") || dep.lexHead.getPOS().equals("VBZ") || dep.lexHead.getPOS().equals("VBP"))){ //Simple subj-verb feats //Increment instance number if in error analysis mode if(sentId!=null)INSTANCENUM++; inc(agrExtractors); //Disjunct features if(dep.lexDep.getOrthography().equals("or")){ ArrayListrels=new ArrayList(2); rels.add("First");rels.add("Next"); Hashtablecdeps=this.getLowerSiblingDeps(inputs,dep.lexDep,rels,null); if(cdeps!=null){ for(Enumeratione=cdeps.keys();e.hasMoreElements();){ LexDependency cdep=e.nextElement(); this.depSign=cdep.lexDep; inc(agrConjExtractors); } } } //Of-complement subjects (for non-numeral, non-%-sign subjs) String subjClass=dep.lexDep.getWords().get(0).getSemClass(); String subjPOS=dep.lexDep.getPOS(); if(subjClass==null)subjClass="NULL"; if(!subjClass.equals("PERCENT") && !subjPOS.startsWith("CD")){ ArrayListrels=new ArrayList(1); rels.add("Mod"); ArrayListdepPreds=new ArrayList(1); depPreds.add("of"); HashtableofComplDeps=this.getLowerSiblingDeps(inputs,dep.lexDep,rels,depPreds); if(ofComplDeps!=null){ for(Enumeratione1=ofComplDeps.keys();e1.hasMoreElements();){ LexDependency ofComplDep=e1.nextElement(); Sign[] ofComplSigns=ofComplDeps.get(ofComplDep).getDerivationHistory().getInputs(); rels=new ArrayList(1); rels.add("Arg1"); HashtableofDeps=this.getLowerSiblingDeps(ofComplSigns,ofComplDep.lexDep,rels,null); if(ofDeps!=null){ for(Enumeratione2=ofDeps.keys();e2.hasMoreElements();){ LexDependency ofDep=e2.nextElement(); this.depSign=ofDep.lexDep; inc(agrOfComplementExtractors); } } } } } } //Relative clause features String whPrn=dep.lexDep.getOrthography(); if((dep.rel.equals("GenRel")||dep.rel.equals("whApposRel")) && (whPrn.equals("that")||whPrn.equals("who")||whPrn.equals("which")||whPrn.equals("whose"))){ //Make sure relative clause is linked to head of the quoted NP //(and not the quotation mark itself) Sign sib=this.getSibling(sign.getSiblingFilledDeps(),"Arg"); if(sib!=null){ this.headSign=sib; } //Simple WH-pronoun features //Increment instance number if in error analysis mode if(sentId!=null)INSTANCENUM++; inc(whExtractors); //Proximal conjunct features if(dep.lexDep.getPOS().equals("CC") || dep.lexDep.getOrthography().equals(",") || dep.lexDep.getOrthography().equals(";")|| dep.lexDep.getOrthography().equals("or")|| 
dep.lexDep.getOrthography().equals("and")){ ArrayListrels=new ArrayList(1); rels.add("Next"); Hashtablecdeps=this.getLowerSiblingDeps(inputs,dep.lexDep,rels,null); if(cdeps!=null){ for(Enumeratione=cdeps.keys();e.hasMoreElements();){ LexDependency cdep=e.nextElement(); this.depSign=cdep.lexDep; inc(whConjExtractors); } } } } } //Punctuation feature extraction: Unbalanced sentence medial appositions are flagged if (sign!=null && inputs!=null) { //Pass up unbalanced punctuation indicator //Result cat of current has unbal feature Category target = sign.getCategory().getTarget(); FeatureStructure fs = target.getFeatureStructure(); String punctFeatVal=null; if ( (fs != null && fs.hasAttribute("unbal"))) { Object val = fs.getValue("unbal"); punctFeatVal = (val instanceof SimpleType) ? ((SimpleType)val).getName() : null; } //Right child (binary case) or only child (unary case) has unbalanced punct feature SignProps childProps=(SignProps)inputs[inputs.length-1].getData(SignProps.class); if(childProps!=null)punctFeatVal=childProps.getUnbalancedPunct(); if(punctFeatVal!=null){ SignProps currProps=new SignProps(punctFeatVal); sign.addData(currProps); } //Extract unbalanced punctuation feature for unbalanced sentence medial punctuation if (inputs.length == 2) { //Left child has unbalanced punct feature SignProps lchildProps=(SignProps)inputs[0].getData(SignProps.class); if(lchildProps!=null && lchildProps.getUnbalancedPunct()!=null){ Word nextWord = inputs[1].getWords().get(0); //Check whether right child begins with a punctuation mark; else fire feature if (!isPunct(nextWord)){ inc(punctExtractor); } } } } } // store it storeFeatureMap(sign); } public Sign getOfComplSign(){ Sign retval=null; return retval; } /** Stores the current feature map as a data object in the given sign. */ protected void storeFeatureMap(Sign sign) { sign.addData(new FeatureMapWrapper(currentMap)); } /** Returns the feature map for this extractor from the given sign (null if none). */ public FeatureMap getFeatureMap(Sign sign) { FeatureMapWrapper fmw = (FeatureMapWrapper)sign.getData(FeatureMapWrapper.class); return (fmw != null) ? fmw.featureMap : null; } /** * Increments the count of the given features, if relevant. 
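* A lazily extracted feature contributes a count to the current feature map only if the alphabet indexes it (indexLazy returns non-null).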
*/ protected void inc(List>> extractors) { for (List> lazyExtractor : extractors) { Alphabet.Feature f = alphabet.indexLazy(lazyExtractor); if (f != null)currentMap.inc(f); } } //------------------------------------ // utility functions //Get value of subject feature from verb's result cat public String getSubjectFeature(Category cat){ String retval=null; if (cat instanceof ComplexCat) { Category resCat = ((ComplexCat)cat).getResult(); retval=this.getSubjectFeature(resCat); } else if (cat instanceof AtomCat) { AtomCat ac = (AtomCat) cat; FeatureStructure fs = ac.getFeatureStructure(); for(String attr: fs.getAttributes()){ if(attr.equals("sbj")){ retval=fs.getValue(attr).toString(); break; } } } return retval; } //checks for punct private boolean isPunct(Word w) { String pos = w.getPOS(); boolean retval = pos.startsWith("PUNCT"); retval = retval || pos.equals(".") || pos.equals(",") || pos.equals(";") || pos.equals(":") || pos.equals("LRB") || pos.equals("RRB"); //if (retval) { //System.out.println("isPunct: " + w.getForm() + " pos: " + pos); //} return retval; } // Get siblings of a given head 1-step down the derivation, given the head-sibling relations and lexical preds of deps .*/ public Hashtable getLowerSiblingDeps(Sign[] inputs,Sign headSign,ArrayListrels,ArrayListdepPreds){ Hashtable retval=new Hashtable(); for(Sign sign: inputs){ if(retval.size()==rels.size())break; Listsdeps=sign.getSiblingFilledDeps(); sdeps.addAll(sign.getFilledDeps()); for(LexDependency sdep: sdeps){ if(sdep.lexHead==headSign && rels.contains(sdep.rel) && !retval.containsKey(sdep)){ if(depPreds==null || depPreds.contains(sdep.lexDep.getOrthography())){ retval.put(sdep,sign); } } } } if(retval.size()==0)retval=null; return retval; } //returns sibling sign of a given head given a relation label private Sign getSibling(List sdeps,String rel){ Sign retval=null; if(sdeps!=null){ for(LexDependency dep: sdeps){ if(dep.rel.equals(rel)){ retval=dep.lexDep; break; } } } return retval; } // returns acceptable paraphrases for words private String adjustWord(String word) { String retval=word; //Account for acceptable paraphrases if (word.equals("'ve")) retval="have"; else if (word.equals("'s")) retval="is"; else if (word.equals("'re")) retval="are"; return retval; } //adjusts POS tags private String adjustPOS(String word,String pos,String semClass) { String retval=pos; if(word.equals("has")) retval="VBZ"; else if (word.equals("have")) retval="VBP"; else if(word.equals("one") || word.equals("1")) pos="CD-1"; else if(semClass!=null && semClass.equals("PERCENT")) retval=semClass; else if(word.equals(",") || word.equals(";")) retval="CC"; return retval; } //adjust sem class info private String adjustSemClass(String semClass) { String retval="UNK"; if(semClass!=null){ String[]temp=semClass.split("\\|"); retval=temp[0].split(":")[0]; } return retval; } //main prefixes (AGR=Agr; CONJ=Conjn/Disjn; WH=wh-pronoun; OF=Of-complement) private void add_prefix_main1(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return "AGR"; }}); } private void add_prefix_main2(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return "AGRCONJ"; }}); } private void add_prefix_main3(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return "AGROF"; }}); } private void add_prefix_main4(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return "AGRWH"; }}); } private void add_prefix_main5(List> retval) { retval.add(new TrieMap.KeyExtractor(){public 
String getKey(){ return "AGRWHCONJ"; }}); } //instance # in error analysis mode private void add_instance_num(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return Integer.toString(INSTANCENUM); }}); } //sub-prefixes (W=Word; P=POS tag; S=Stem; C=SemClass) private void add_prefix_sub1(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return "WW"; }}); } private void add_prefix_sub2(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return "WP"; }}); } private void add_prefix_sub3(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return "PW"; }}); } private void add_prefix_sub4(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return "PP"; }}); } private void add_prefix_sub5(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return "WS"; }}); } private void add_prefix_sub6(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return "WC"; }}); } //select required feature prefix private void add_prefix(int prefix,List> retval) { switch (prefix) { case 1:add_prefix_main1(retval);break; case 2:add_prefix_main2(retval);break; case 3:add_prefix_main3(retval);break; case 4:add_prefix_main4(retval);break; case 5:add_prefix_main5(retval);break; } } // ------------------------------- // feature extractors // dep-word-head-word private List> dep_word_head_word(int prefix) { List> retval = new ArrayList>(3); if(this.sentId!=null)add_instance_num(retval); add_prefix(prefix,retval); add_prefix_sub1(retval); add_dep_word(retval); add_head_word(retval); return retval; } //dep-word head-pos private List> dep_word_head_pos(int prefix) { List> retval = new ArrayList>(3); if(this.sentId!=null)add_instance_num(retval); add_prefix(prefix,retval); add_prefix_sub2(retval); add_dep_word(retval); add_head_pos(retval); return retval; } //dep-pos head-word private List> dep_pos_head_word(int prefix) { List> retval = new ArrayList>(3); if(this.sentId!=null)add_instance_num(retval); add_prefix(prefix,retval); add_prefix_sub3(retval); add_dep_pos(retval); add_head_word(retval); return retval; } //dep-pos head-pos private List> dep_pos_head_pos(int prefix) { List> retval = new ArrayList>(3); if(this.sentId!=null)add_instance_num(retval); add_prefix(prefix,retval); add_prefix_sub4(retval); add_dep_pos(retval); add_head_pos(retval); return retval; } //dep-word head-stem private List> dep_word_head_stem(int prefix) { List> retval = new ArrayList>(3); if(this.sentId!=null)add_instance_num(retval); add_prefix(prefix,retval); add_prefix_sub5(retval); add_dep_word(retval); add_head_stem(retval); return retval; } //dep-word head-class private List> dep_word_head_class(int prefix) { List> retval = new ArrayList>(3); if(this.sentId!=null)add_instance_num(retval); add_prefix(prefix,retval); add_prefix_sub6(retval); add_dep_word(retval); add_head_class(retval); return retval; } //unbalanced punctuation private List> unbal_punct() { List> retval = new ArrayList>(1); retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return "$punct"; }}); return retval; } //head word private void add_head_word(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ String word=adjustWord(headSign.getWordForm());return word; }}); } //head stem private void add_head_stem(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return headSign.getWords().get(0).getStem();}}); } //head class private void 
add_head_class(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ String semClass=adjustSemClass(headSign.getWords().get(0).getSemClass());return semClass;}}); } // head pos private void add_head_pos(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ String pos=adjustPOS(headSign.getOrthography(),headSign.getPOS(),headSign.getWords().get(0).getSemClass());return pos; }}); } // dep word private void add_dep_word(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ String word=adjustWord(depSign.getWordForm());return word; }}); } // dep pos private void add_dep_pos(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ String pos=adjustPOS(depSign.getOrthography(),depSign.getPOS(),depSign.getWords().get(0).getSemClass());return pos; }}); } } ================================================ FILE: src/opennlp/ccg/hylo/Flattener.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-6 Michael White (University of Edinburgh, The Ohio State University) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import opennlp.ccg.synsem.*; import opennlp.ccg.util.*; import java.util.*; import gnu.trove.*; /** * A class for performing flattening operations on LFs. * * @author Michael White * @version $Revision: 1.5 $, $Date: 2011/06/06 18:52:30 $ **/ public class Flattener { // the resulting preds private List preds = new ArrayList(); // counter for alts private int altCount = 0; // counter for opts private int optCount = 0; // root preds private List roots = new ArrayList(); // map from preds to children from original expression (identity keys); // includes dummy parents to preserve structure private ListMap childMap = new ListMap(true); // map from nominals to highest pred for that nominal from original expression private Map nomMap = new HashMap(); // map from pred to depth in original expression private Map depthMap = new HashMap(); // map from nominal to highest parent nominal in original expression, or null if a root private Map parentMap = new HashMap(); // null nominal for use in dummy parents during flattening private static Nominal nullNom = new NominalAtom("null"); // null prop for use in dummy parents during flattening private static Proposition nullProp = new Proposition("null"); /** * Returns a map from a nominal to its highest parent nominal in the original expression, * after flattening, or null if none. */ public Map getHighestParentMap() { return parentMap; } /** * Recursively flattens the given LF and returns a list of elementary preds. 
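* For example, @x1(want ^ <TENSE>pres ^ <Arg1>x2) is flattened into the elementary preds @x1(want), @x1(<TENSE>pres) and @x1(<Arg1>x2).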
* LF chunks are preserved on satops, as are alts (exclusive disjunctions) * and opts (optional parts). * Chunks, alts and opts are propagated through shared nominals. * A runtime exception is thrown if the LF cannot be flattened. */ public List flatten(LF lf) { flatten(lf, null, null, 0, new Stack(), new TIntArrayList()); if (altCount > 0 || optCount > 0) propAltsOptsChunks(); return preds; } // recursive flattening, with conversion of alts and opts private void flatten( LF lf, Nominal currentNominal, SatOp parent, int depth, Stack alts, TIntArrayList opts ) { if (lf instanceof SatOp) { // flatten arg with new current nominal SatOp satOp = (SatOp) lf; currentNominal = satOp.getNominal(); SatOp dummyParent = makeDummySatOp(currentNominal); addSatOp(dummyParent, parent, depth, alts, opts, lf); flatten(satOp.getArg(), currentNominal, dummyParent, depth, alts, opts); } else if (lf instanceof Op) { Op op = (Op) lf; SatOp dummyParent = makeDummySatOp(currentNominal); addSatOp(dummyParent, parent, depth, alts, opts, lf); if (op._name.equals(Op.XOR)) { // introduce new alt set; add alt for each item int altSet = altCount++; for (int i = 0; i < op._args.size(); i++) { alts.push(new Alt(altSet, i)); LF arg = op._args.get(i); flatten(arg, currentNominal, dummyParent, depth+1, alts, opts); alts.pop(); } } else if (op._name.equals(Op.OPT)) { // introduce new opt index for arg opts.add(optCount++); LF arg = op._args.get(0); flatten(arg, currentNominal, dummyParent, depth+1, alts, opts); opts.remove(opts.size()-1); } else { // otherwise just flatten each item for (Iterator it = op.getArguments().iterator(); it.hasNext(); ) { flatten(it.next(), currentNominal, dummyParent, depth+1, alts, opts); } } } else if (lf instanceof Proposition) { // add SatOp for lf if (currentNominal == null) { throw new RuntimeException("No current nominal in trying to flatten " + lf); } SatOp satOp = new SatOp(currentNominal, lf); addSatOp(satOp, parent, depth, alts, opts, lf); } else if (lf instanceof HyloVar) { // just skip for now } else if (lf instanceof Diamond) { Diamond diamond = (Diamond) lf; LF arg = diamond.getArg(); if (arg instanceof Proposition || arg instanceof Nominal || arg instanceof HyloVar) { // add SatOp for diamond SatOp satOp = new SatOp(currentNominal, lf); addSatOp(satOp, parent, depth, alts, opts, lf); } else if (arg instanceof Op && ((Op)arg)._name.equals(Op.CONJ)) { // add SatOp for diamond with first nominal arg, // and flatten the rest of the args with the first nominal arg as the // new current nominal Op argOp = (Op) arg; Iterator args = argOp._args.iterator(); LF firstArg = args.next(); if (!(firstArg instanceof Nominal)) { throw new RuntimeException("First arg of diamond is not a nominal: " + firstArg); } Nominal firstNominalArg = (Nominal) firstArg; // add SatOp for diamond SatOp satOp = new SatOp(currentNominal, new Diamond(diamond.getMode(), firstNominalArg)); addSatOp(satOp, parent, depth, alts, opts, lf); // flatten rest of list for (; args.hasNext(); ) { flatten(args.next(), firstNominalArg, satOp, depth+1, alts, opts); } } else if (arg instanceof Op && ((Op)arg)._name.equals(Op.XOR)) { Op argOp = (Op) arg; SatOp dummyParent = makeDummySatOp(currentNominal); addSatOp(dummyParent, parent, depth, alts, opts, lf); // as before, process xor by introducing new alt set and adding alt for each disjunct; // this time, also assume each disjunct is a conj op or nominal, and add a diamond satop // to the disjunct nominal int altSet = altCount++; for (int i = 0; i < argOp._args.size(); i++) { 
alts.push(new Alt(altSet, i)); LF disjunct = argOp._args.get(i); if (!(disjunct instanceof Op && ((Op)disjunct)._name.equals(Op.CONJ)) && !(disjunct instanceof Nominal)) { throw new RuntimeException("Disjunct of diamond is not a conj op or nominal: " + disjunct); } // conj op case if (disjunct instanceof Op) { Op disjunctOp = (Op) disjunct; Iterator args = disjunctOp._args.iterator(); LF firstArg = args.next(); if (!(firstArg instanceof Nominal)) { throw new RuntimeException("First arg of conj op under xor op is not a nominal: " + firstArg); } // add SatOp for diamond Nominal disjunctNominal = (Nominal) firstArg; SatOp satOp = new SatOp(currentNominal, new Diamond(diamond.getMode(), disjunctNominal)); addSatOp(satOp, dummyParent, depth+1, alts, opts, lf); // flatten rest of list for (; args.hasNext(); ) { flatten(args.next(), disjunctNominal, satOp, depth+2, alts, opts); } } // nominal case else { // just add SatOp for diamond Nominal disjunctNominal = (Nominal) disjunct; SatOp satOp = new SatOp(currentNominal, new Diamond(diamond.getMode(), disjunctNominal)); addSatOp(satOp, dummyParent, depth+1, alts, opts, lf); } alts.pop(); } } else { throw new RuntimeException("Arg of diamond is not a proposition, nominal or list: " + arg); } } else throw new RuntimeException("Unable to flatten " + lf); } // makes a dummy satop for the given nominal, if any; otherwise uses nullNom private static SatOp makeDummySatOp(Nominal nom) { return new SatOp((nom != null) ? nom : nullNom, nullProp); } // handles new preds private void addSatOp(SatOp satOp, SatOp parent, int depth, Stack alts, TIntArrayList opts, LF lf) { // add non-dummy satops to result if (satOp._arg != nullProp) preds.add(satOp); // update roots, maps if (parent == null) roots.add(satOp); else childMap.put(parent, satOp); Nominal nom = satOp._nominal; if (!nom.isShared()) { if (!nomMap.containsKey(nom) || depth < depthMap.get(nom)) { nomMap.put(nom, satOp); depthMap.put(nom, depth); parentMap.put(nom, (parent != null && parent._nominal != nullNom) ? parent._nominal : null); } } // set alts, opts, chunks if (!alts.empty()) satOp.alts = new ArrayList(alts); if (opts.size() > 0) satOp.opts = new TIntArrayList(opts.toNativeArray()); satOp.setChunks(lf.getChunks()); } // propagates alts, opts and chunks down from roots private void propAltsOptsChunks() { // propagate for each root nom List alts = Collections.emptyList(); TIntArrayList opts = new TIntArrayList(0); TIntArrayList chunks = new TIntArrayList(0); for (SatOp root : roots) { propAltsOptsChunks(root, alts, opts, chunks); } } // prop alts, opts & chunks, recursing through preds in child map and shared nom refs in nomMap private void propAltsOptsChunks(SatOp satOp, List alts, TIntArrayList opts, TIntArrayList chunks) { // prop alts and opts if (!alts.isEmpty()) { if (satOp.alts == null) satOp.alts = new ArrayList(3); for (Alt alt : alts) { if (!satOp.alts.contains(alt)) satOp.alts.add(alt); } Collections.sort(satOp.alts); } if (!opts.isEmpty()) { if (satOp.opts == null) satOp.opts = new TIntArrayList(3); for (int i=0; i < opts.size(); i++) { int opt = opts.get(i); if (!satOp.opts.contains(opt)) satOp.opts.add(opt); } satOp.opts.sort(); } if (!chunks.isEmpty()) { if (satOp.chunks == null) satOp.chunks = new TIntArrayList(3); for (int i=0; i < chunks.size(); i++) { int chunk = chunks.get(i); if (!satOp.chunks.contains(chunk)) satOp.chunks.add(chunk); } satOp.chunks.sort(); } // gather alts, opts & chunks for recursion List alts2 = (satOp.alts != null) ? 
satOp.alts : alts; TIntArrayList opts2 = (satOp.opts != null) ? satOp.opts : opts; TIntArrayList chunks2 = (satOp.chunks != null) ? satOp.chunks : chunks; // recurse through children, if any List children = childMap.get(satOp); if (children != null) { for (SatOp child : children) propAltsOptsChunks(child, alts2, opts2, chunks2); } // recurse through shared nominals, if apropos Nominal nom = satOp._nominal; if (nom.isShared()) { SatOp nomPred = nomMap.get(nom); if (nomPred != null) propAltsOptsChunks(nomPred, alts2, opts2, chunks2); } Nominal nom2 = HyloHelper.getSecondaryNominal(satOp); if (nom2 != null && nom2.isShared()) { SatOp nom2Pred = nomMap.get(nom2); if (nom2Pred != null) propAltsOptsChunks(nom2Pred, alts2, opts2, chunks2); } } } ================================================ FILE: src/opennlp/ccg/hylo/HyloAtom.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import opennlp.ccg.unify.*; import gnu.trove.*; /** * A logical atomic formula. * The type is optional, so by default, it is not considered in determining equality. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.9 $, $Date: 2009/12/21 03:27:19 $ **/ public abstract class HyloAtom extends HyloFormula { private static final long serialVersionUID = 1L; protected String _name; protected SimpleType type; protected HyloAtom(String name) { this(name, null); } protected HyloAtom(String name, SimpleType st) { _name = name; type = st; } public void setAtomName(String name) { _name = name; } public String getName() { return _name; } public SimpleType getType() { return type; } public boolean occurs(Variable var) { return false; } public String toString() { return _name; } /** * Returns a pretty-printed string of this LF, with the given indent. */ public String prettyPrint(String indent) { return toString(); } public int compareTo(HyloAtom ha) { return _name.compareTo(ha._name); } /** Returns a hash code based on the atom name. */ public int hashCode() { return _name.hashCode(); } /** * Returns whether this atom equals the given object * based on the atom name. */ public boolean equals(Object obj) { if (this == obj) return true; if (obj == null || obj.getClass() != this.getClass()) { return false; } HyloAtom ha = (HyloAtom) obj; return _name.equals(ha._name); } /** * Returns a hash code using the given map from vars to ints. */ public int hashCode(TObjectIntHashMap varMap) { return hashCode(); } /** * Returns whether this atom equals the given object * up to variable names, using the given maps from vars to ints. 
*/ public boolean equals(Object obj, TObjectIntHashMap varMap, TObjectIntHashMap varMap2) { return equals(obj); } } ================================================ FILE: src/opennlp/ccg/hylo/HyloFormula.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-3 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import java.io.Serializable; import org.jdom.*; import gnu.trove.*; import opennlp.ccg.synsem.*; import opennlp.ccg.unify.*; /** * A parent class to implement reasonable default behavior for classes * representing data structures for hybrid logic. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.13 $, $Date: 2009/12/21 03:27:19 $ **/ public abstract class HyloFormula implements LF, Serializable { private static final long serialVersionUID = 1L; /** * The LF chunks to which this LF belongs. */ protected TIntArrayList chunks = null; /** * Sets the LF chunks to which this LF belongs. * LF chunks are used during realization to ensure * that certain edges are semantically complete * before combination is attempted with edges * with semantics outside the chunk. * The chunks are numbered starting with 0, * and null represents no chunks. */ public void setChunks(TIntArrayList chunks) { this.chunks = chunks; } /** * Gets the LF chunks to which this LF belongs. */ public TIntArrayList getChunks() { return chunks; } /** Returns null as the default type. */ public SimpleType getType() { return null; } /** * Returns a copy of this LF. * (LF chunks are not copied.) */ public abstract LF copy(); /** * Applies a ModFcn to this LF and then applies it to all fields * which are themselves Mutables. * * @param mf a function to be applied */ public void deepMap(ModFcn mf) { mf.modify(this); } /** * Unify this Unfiable with another Object. * This default implementation will reverse the direction of unification * for a variable, otherwise it fails. * NB: The implementation of unification in the hylo package is not * complete; a particular limitation is that no attempt is made to unify lists of terms * connected by an Op instance. * * @param o object to unify with * @param s Substitution containing the variable resolutions * @exception UnifyFailure if this Unifiable cannot be unified with * the Object * @return an object which represents the unification of * this Unifiable with the Object */ public Object unify(Object u, Substitution s) throws UnifyFailure { if (u instanceof Variable) return ((Unifiable)u).unify(this, s); else throw new UnifyFailure(this.toString(), u.toString()); } /** * Check if this Unifiable can unify with another Object. 
This * should be implemented as a quick check to allow users of the * Unifiable to scan a group of Unifications to rapidly see if the * entire group is at least possible before descending into each * one with a full unification procedure. Thus, if a call to this * method does not result in a UnifyFailure exception being * thrown, it doesn't mean that the Object can definitely be * unified with this Unifiable -- what is important is that when a * call to this method throws a UnifyFailure exception, it permits * one to avoid calling the unify() method on other Unifiables in * a group because the quick check failed on this one. * * @param o object to check for unifiability * @exception UnifyFailure if this Unifiable cannot be unified with * the Object * @return the Object o, unmodified **/ public void unifyCheck(Object u) throws UnifyFailure {} /** * Replaces any variables in this Unifiable with the values found * for them in the Substitution argument. * * @param s Substitution containing the variable resolutions * @return a copy of this Unifiable with all variables from the * Substitution replaced by their values. */ public Object fill(Substitution s) throws UnifyFailure { return this; } /** * Returns a hash code using the given map from vars to ints. */ public abstract int hashCode(TObjectIntHashMap varMap); /** * Returns whether this LF equals the given object * up to variable names, using the given maps from vars to ints. */ public abstract boolean equals(Object obj, TObjectIntHashMap varMap, TObjectIntHashMap varMap2); /** * Returns an XML representation of this LF. */ public abstract Element toXml(); /** * Returns a pretty-printed string of this LF, with the given indent. */ public abstract String prettyPrint(String indent); } ================================================ FILE: src/opennlp/ccg/hylo/HyloHelper.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-5 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import opennlp.ccg.synsem.*; import opennlp.ccg.unify.*; import opennlp.ccg.grammar.*; import opennlp.ccg.lexicon.Lexicon; import org.jdom.*; import java.util.*; import gnu.trove.*; /** * A utility class to help with certain global operations over hybrid logic * terms. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.43 $, $Date: 2011/08/26 05:18:39 $ **/ public class HyloHelper { //----------------------------------------------------------------- // XML functions /** * Builds a Hylo term from the given element. * An "lf" element may be used to wrap one or more (implicitly conj-ed) terms. 
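 *
 * A small illustration (the element is built here via JDOM for brevity; in practice it
 * typically comes from a grammar or testbed file):
 * <pre>{@code
 * Element propElt = new Element("prop");
 * propElt.setAttribute("name", "dog");
 * LF prop = HyloHelper.getLF(propElt);  // a Proposition named "dog"
 * }</pre>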
*/ public static LF getLF(Element e) { LF retval = null; String type = e.getName(); if (type.equals("op")) { retval = new Op(e); } else if (type.equals("var")) { String name = getName(e); retval = new HyloVar(prefix(name), type(name)); } else if (type.equals("nomvar")) { String name = getName(e); boolean shared = "true".equals(e.getAttributeValue("shared")); retval = new NominalVar(prefix(name), type(name), shared); } else if (type.equals("nom")) { String name = getName(e); boolean shared = "true".equals(e.getAttributeValue("shared")); retval = new NominalAtom(prefix(name), type(name), shared); } else if (type.equals("prop")) { String name = getName(e); retval = new Proposition(name, existingType(name)); } else if (type.equals("satop")) { retval = new SatOp(e); } else if (type.equals("box") || type.equals("b")) { retval = new Box(e); } else if (type.equals("diamond") || type.equals("d")) { retval = new Diamond(e); } else if (type.equals("mode")) { String name = getName(e); retval = new ModeLabel(name); } else if (type.equals("modevar")) { String name = getName(e); retval = new ModeVar(name); } else if (type.equals("lf")) { retval = getLF_FromChildren(e); } else { System.out.println("Invalid hybrid logic LF type: " + type); } // assign chunks if (retval != null) { String chunks = e.getAttributeValue("chunks"); if (chunks != null) { retval.setChunks(convertChunks(chunks)); } } // done return retval; } // returns the value of the attribute 'name' or 'n' private static String getName(Element e) { String name = e.getAttributeValue("name"); if (name == null) name = e.getAttributeValue("n"); return name; } // returns the simple type with the given name, if it exists, or null if not private static SimpleType existingType(String name) { Types types = Grammar.theGrammar.types; if (types.containsSimpleType(name)) return types.getSimpleType(name); else return null; } /** Returns the prefix of the name, up to an optional colon. */ protected static String prefix(String name) { int index = name.indexOf(":"); if (index >= 0) return name.substring(0, index); else return name; } /** Returns the simple type given by the suffix of the name after the colon, or null if none. */ protected static SimpleType type(String name) { int index = name.indexOf(":"); String suffix = (index >=0 && index+1 < name.length()) ? name.substring(index+1) : null; if (suffix != null) return Grammar.theGrammar.types.getSimpleType(suffix); else return null; } /** * Returns a Hylo term from the children of the given element, * adding an implicit CONJ op if necessary. */ @SuppressWarnings("unchecked") public static LF getLF_FromChildren(Element e) { List children = e.getChildren(); if (children.size() > 1) { List preds = new ArrayList(children.size()); for (int i=0; i < children.size(); i++) { preds.add(getLF(children.get(i))); } Op conj = new Op(Op.CONJ, preds); return conj; } else return getLF(children.get(0)); } /** * Returns an XML representation of the given LF, * wrapped with an 'lf' element, * removing CONJ ops that may be left implicit. */ public static Element toXml(LF lf) { Element retval = new Element("lf"); retval.addContent(lf.toXml()); removeConjOps(retval); return retval; } //----------------------------------------------------------------- // process chunks /** * Processes and removes any chunk elements. * Each chunk element is numbered, and all contained elements are marked * as being contained by this chunk, via a "chunks" attribute. 
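 *
 * A sketch of one way to use this together with getLF_FromChildren (reading lfElt from XML
 * is assumed):
 * <pre>{@code
 * HyloHelper.processChunks(lfElt);               // number chunk wrappers, mark contents, drop wrappers
 * LF lf = HyloHelper.getLF_FromChildren(lfElt);  // contained terms now carry their "chunks" attributes
 * }</pre>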
*/ public static void processChunks(Element e) { processChunks(e, null, 0); removeChunkElts(e); } // recursively processes chunks, threading count through calls @SuppressWarnings("unchecked") private static int processChunks(Element e, String chunks, int count) { // check for chunk if (e.getName().equals("chunk")) { // update chunks string and counter if (chunks == null) { chunks = "" + count; } else { chunks += " " + count; } count++; } // otherwise add chunks attr, if val non-null else if (chunks != null) { e.setAttribute("chunks", chunks); } // do children List children = e.getChildren(); for (int i=0; i < children.size(); i++) { count = processChunks(children.get(i), chunks, count); } // return current count return count; } // converts chunk strings private static TIntArrayList convertChunks(String chunks) { String[] tokens = chunks.split("\\s+"); TIntArrayList retval = new TIntArrayList(tokens.length); for (int i = 0; i < tokens.length; i++) { retval.add(Integer.parseInt(tokens[i])); } return retval; } //----------------------------------------------------------------- // recursively remove certain elements private static abstract class ElementTest { abstract boolean test(Element elt); } // recursively removes elements meeting given test @SuppressWarnings("unchecked") private static void removeElts(Element elt, ElementTest eltTest) { // nb: need to dump children into a new list, in order to get a list iterator // that will allow multiple adds List children = elt.getChildren(); List newChildren = new ArrayList(children.size()); newChildren.addAll(children); for (ListIterator li = newChildren.listIterator(); li.hasNext(); ) { Element nextElt = li.next(); removeElts(nextElt, eltTest); if (eltTest.test(nextElt)) { li.remove(); for (Iterator it = nextElt.getChildren().iterator(); it.hasNext(); ) { Element childElt = it.next(); it.remove(); // removes childElt from nextElt's children, so it can become a child of elt li.add(childElt); } } } elt.removeContent(); elt.setContent(newChildren); } // recursively removes conj ops private static void removeConjOps(Element lfElt) { removeElts( lfElt, new ElementTest() { boolean test(Element elt) { return elt.getName().equals("op") && elt.getAttributeValue("name").equals(Op.CONJ); } } ); } // recursively removes chunk elements private static void removeChunkElts(Element lfElt) { removeElts( lfElt, new ElementTest() { boolean test(Element elt) { return elt.getName().equals("chunk"); } } ); } //----------------------------------------------------------------- // functions for elementary predications /** * Returns whether the given LF is an elementary predication, * ie a lexical predication, relation predication or attribute-value predication. */ public static boolean isElementaryPredication(LF lf) { return isLexPred(lf) || isRelPred(lf) || isAttrPred(lf); } /** * Returns whether the given elementary predication is a lexical predication, * ie one of the form @x(prop). */ public static boolean isLexPred(LF pred) { if (!(pred instanceof SatOp)) return false; SatOp satOp = (SatOp) pred; LF arg = satOp.getArg(); return (arg instanceof Proposition); } /** * Returns whether the given elementary predication is a relation predication, * ie one of the form @x(<Rel>y). 
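 * For instance (with illustrative names), @x(<Det>d1) is a relation predication, since the
 * argument of the diamond is the nominal d1, whereas @x(<det>nil) is an attribute-value
 * predication (see isAttrPred), since its argument is a proposition.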
*/ public static boolean isRelPred(LF pred) { if (!(pred instanceof SatOp)) return false; SatOp satOp = (SatOp) pred; LF arg = satOp.getArg(); if (!(arg instanceof Diamond)) return false; Diamond d = (Diamond) arg; return (d.getArg() instanceof Nominal); } /** * Returns whether the given elementary predication is an attribute-value predication, * ie one of the form @x(<Rel>prop). Note that the prop is also allowed to be * a HyloVar. */ public static boolean isAttrPred(LF pred) { if (!(pred instanceof SatOp)) return false; SatOp satOp = (SatOp) pred; LF arg = satOp.getArg(); return isAttr(arg); } /** * Returns whether the given arg is an attribute-value pair, * ie one of the form <Rel>prop. Note that the prop is also allowed to be * a HyloVar. */ public static boolean isAttr(LF arg) { if (!(arg instanceof Diamond)) return false; Diamond d = (Diamond) arg; LF dArg = d.getArg(); return ( dArg instanceof Proposition || (dArg instanceof HyloVar && !(dArg instanceof NominalVar)) ); } /** * Returns the name of the lexical predicate of the given elementary predication, * or null, if the given LF is not a lexical predicate. */ public static String getLexPred(LF lf) { if (!isLexPred(lf)) return null; LF arg = ((SatOp)lf).getArg(); return ((Proposition)arg).toString(); } /** * Returns the name of the relation of the given elementary predication, * or null, if the given LF is not a relation or attribute-value predicate. */ public static String getRel(LF lf) { if (!isRelPred(lf) && !isAttrPred(lf)) return null; LF arg = ((SatOp)lf).getArg(); return ((Diamond)arg).getMode().toString(); } /** * Returns the string value of the attribute-value predicate, or * null if the given LF is not an attribute-value predicate or has no value. */ public static String getVal(LF lf) { if (!isAttrPred(lf)) return null; LF arg = ((SatOp)lf).getArg(); LF dArg = ((Diamond)arg).getArg(); if (dArg instanceof Proposition) return ((Proposition)dArg).getName(); return null; } /** * Returns the principal nominal the given elementary predication, * or null, if the given LF is not an elementary predication. */ public static Nominal getPrincipalNominal(LF lf) { if (!isElementaryPredication(lf)) return null; return ((SatOp)lf).getNominal(); } /** * Returns the secondary nominal of the given elementary predication, * or null, if the given LF is not a relation predication. */ public static Nominal getSecondaryNominal(LF lf) { if (!isRelPred(lf)) return null; LF arg = ((SatOp)lf).getArg(); return (Nominal) ((Diamond)arg).getArg(); } //----------------------------------------------------------------- // flattening /** * Returns a flattened, sorted list of elementary preds from the given LF * as a conjunction op, or as a single LF, if there is only one. * LF chunks are preserved on satops, as are alts (exclusive disjunctions) * and opts (optional parts). * A runtime exception is thrown if the LF cannot be flattened. */ @SuppressWarnings("unchecked") public static LF flattenLF(LF lf) { List preds = flatten(lf); if (preds.size() == 1) { return (LF) preds.get(0); } else { return new Op(Op.CONJ, (List)preds); } } /** * Returns a list of predications from the given LF, which is assumed to be either * a conjunction of elementary predications or a single elementary predication. 
*/ public static List getPreds(LF lf) { if (lf instanceof Op && ((Op)lf).getName().equals(Op.CONJ)) { List args = ((Op)lf).getArguments(); List retval = new ArrayList(args.size()); for (LF arg : args) retval.add((SatOp)arg); return retval; } else { List retval = new ArrayList(1); retval.add((SatOp)lf); return retval; } } /** * Returns the first elementary predication from the given LF, which is assumed to be either * a conjunction of elementary predications or a single elementary predication; * otherwise returns null. */ public static SatOp getFirstPred(LF lf) { if (lf instanceof SatOp) return (SatOp) lf; if (lf instanceof Op && ((Op)lf).getName().equals(Op.CONJ)) { List args = ((Op)lf).getArguments(); return (SatOp) args.get(0); } return null; } /** * Returns a flattened, sorted list of elementary preds from the given LF * as a list. * LF chunks are preserved on satops, as are alts (exclusive disjunctions) * and opts (optional parts). * Chunks, alts and opts are propagated through shared nominals. * A runtime exception is thrown if the LF cannot be flattened. */ public static List flatten(LF lf) { List retval = new Flattener().flatten(lf); sort(retval); return retval; } /** * Returns the first elementary predication in the flattened LF. * A runtime exception is thrown if the LF cannot be flattened. */ public static LF firstEP(LF lf) { List preds = new Flattener().flatten(lf); return preds.get(0); } /** * Sets the origin of the elementary preds in the given LF (if any). */ public static void setOrigin(LF lf, LexSemOrigin origin) { if (lf == null) return; if (lf instanceof SatOp) ((SatOp)lf).setOrigin(origin); else if (lf instanceof Op && ((Op)lf).getName().equals(Op.CONJ)) { List args = ((Op)lf).getArguments(); for (LF arg : args) { if (arg instanceof SatOp) ((SatOp)arg).setOrigin(origin); } } } /** * Returns a map from nominals to index positions for the first EP for * that nominal in a sorted list of elementary predications. */ public static Map nomIndex(List preds) { HashMap retval = new HashMap(preds.size()/2); for (int i=0; i < preds.size(); i++) { SatOp pred = preds.get(i); Nominal nom = pred._nominal; if (!retval.containsKey(nom)) retval.put(nom, i); } return retval; } /** * Returns whether a nominal is a root in the list of EPs using a linear search. */ public static boolean isRoot(Nominal nom, List preds) { for (SatOp pred : preds) { Nominal child = getSecondaryNominal(pred); if (child != null && child.equals(nom)) return false; } return true; } //----------------------------------------------------------------- // lexical dependencies /** Returns the unfilled lexical dependencies for a lexical item's LF. */ public static List getUnfilledLexDeps(LF lf) { if (lf == null) return Collections.emptyList(); return LexDependency.unfilledLexDeps(getPreds(lf)); } /** * Returns the filled lexical dependencies from those in the unfilled list * by checking the sign's LF for ones that have become filled, removing the * corresponding no longer unfilled deps. */ public static List getFilledLexDeps(List unfilled, LF lf) { if (lf == null) return Collections.emptyList(); return LexDependency.filledLexDeps(unfilled, getPreds(lf)); } /** * Returns the semantic features (attribute-value preds) for the given nominal * in the given LF. 
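 *
 * Typical use, mirroring the definiteness check in LexDepFeatureExtractor (npSign is assumed
 * to be a sign with an NP category):
 * <pre>{@code
 * Nominal npNom = npSign.getCategory().getIndexNominal();
 * List<SatOp> semFeats = HyloHelper.getSemFeatsForHead(npNom, npSign.getCategory().getLF());
 * }</pre>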
*/ public static List getSemFeatsForHead(Nominal nominal, LF lf) { if (nominal == null || lf == null) return Collections.emptyList(); List retval = new ArrayList(3); for (SatOp pred : getPreds(lf)) { if (nominal.equals(pred._nominal) && isAttrPred(pred)) retval.add(pred); } return retval; } //----------------------------------------------------------------- // compacting /** Composes compact and convertNominals. */ public static LF compactAndConvertNominals(LF lf, Nominal root) { LF retval = compact(lf, root); convertNominals(retval); return retval; } /** Composes compact and convertNominals with a root sign, for conversion using word positions. */ public static LF compactAndConvertNominals(LF lf, Nominal root, Sign rootSign) { root = convertNominals(lf, rootSign, root); LF retval = compact(lf, root); return retval; } /** * Returns a compacted LF from the given flattened one. * A root nominal may also be given (otherwise null). * Nominals with multiple parents are kept separate. * If there are any duplicate predications, an attempt * is made to attach them in different locations. */ public static LF compact(LF lf, Nominal root) { return Compacter.compact(lf, root); } //----------------------------------------------------------------- // convert nominals /** Converts nominal vars to atoms, renaming them based on lexical propositions. */ public static void convertNominals(LF lf) { Converter.convertNominals(lf); } /** * Converts nominal vars to atoms, renaming them based on word position, if * a root sign is given, otherwise using lexical propositions; * returns the converted nominal root. */ public static Nominal convertNominals(LF lf, Sign root, Nominal nominalRoot) { return Converter.convertNominals(lf, root, nominalRoot); } /** * Converts nominal atoms back to vars, returning the converted nominal root. * The LF is assumed to be flattened to elementary predications. */ public static Nominal convertNominalsToVars(LF lf, Nominal nominalRoot) { return Converter.convertNominalsToVars(getPreds(lf), nominalRoot); } //----------------------------------------------------------------- // append /** * Returns a the conjunction of the two LFs, either * as a conjunction op, or as a single LF, if one is null. * If either LF is itself a conj op, its elements are appended * instead of the conj op itself. * If both LFs are null, null is returned. */ public static LF append(LF lf1, LF lf2) { // set up new list int size = 0; List args1 = null; if (lf1 instanceof Op && ((Op)lf1).getName().equals(Op.CONJ)) { args1 = ((Op)lf1).getArguments(); size += args1.size(); } else if (lf1 != null) { size++; } List args2 = null; if (lf2 instanceof Op && ((Op)lf2).getName().equals(Op.CONJ)) { args2 = ((Op)lf2).getArguments(); size += args2.size(); } else if (lf2 != null) { size++; } List combined = new ArrayList(size); // add to new list if (args1 != null) { combined.addAll(args1); } else if (lf1 != null) { combined.add(lf1); } if (args2 != null) { combined.addAll(args2); } else if (lf2 != null) { combined.add(lf2); } // return if (combined.isEmpty()) { return null; } else if (combined.size() == 1) { return combined.get(0); } else { return new Op(Op.CONJ, combined); } } //----------------------------------------------------------------- // sort /** * Sorts the list of elementary predications in a conj op, * or does nothing if the LF is not a conj op. 
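 *
 * The comparator below orders preds by principal nominal, then by predication type (lexical,
 * then attribute-value, then relation preds), then by relation sort index and name, and
 * finally by secondary nominal. An illustrative result for preds sharing nominal w1
 * (relation and feature names made up):
 * <pre>
 *   @w1(want)        lexical pred
 *   @w1(<num>sg)     attribute-value pred
 *   @w1(<Det>d1)     relation pred
 * </pre>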
*/ public static void sort(LF lf) { if (lf instanceof Op && ((Op)lf).getName().equals(Op.CONJ)) { sort(((Op)lf).getArguments()); } } /** * Sorts a list of elementary predications. */ public static void sort(List preds) { Collections.sort(preds, predComparator); } // compares elementary predications private static final Comparator predComparator = new Comparator() { public int compare(LF lf1, LF lf2){ // sort first on principal nominal int nomCompare = getPrincipalNominal(lf1).compareTo(getPrincipalNominal(lf2)); if (nomCompare != 0) return nomCompare; // sort next on type of elementary predication int typeCompare = epType(lf1).compareTo(epType(lf2)); if (typeCompare != 0) return typeCompare; // then on lex pred if (isLexPred(lf1)) { return getLexPred(lf1).compareToIgnoreCase(getLexPred(lf2)); } // then rels String rel1 = getRel(lf1); String rel2 = getRel(lf2); Lexicon theLexicon = Grammar.theGrammar.lexicon; Integer rel1Index = theLexicon.getRelationSortIndex(rel1); Integer rel2Index = theLexicon.getRelationSortIndex(rel2); int relIndexCompare = rel1Index.compareTo(rel2Index); if (relIndexCompare != 0) return relIndexCompare; int relCompare = rel1.compareToIgnoreCase(rel2); if (relCompare != 0) return relCompare; // then secondary nominal if (isRelPred(lf1)) { return getSecondaryNominal(lf1).compareTo(getSecondaryNominal(lf2)); } // otherwise 0 return 0; } }; // order of elementary predication type private static Integer epType(LF lf) { if (isLexPred(lf)) return LEX_PRED; else if (isAttrPred(lf)) return ATTR_PRED; else if (isRelPred(lf)) return REL_PRED; // shouldn't happen else return null; } private static Integer LEX_PRED = new Integer(1); private static Integer ATTR_PRED = new Integer(2); private static Integer REL_PRED = new Integer(3); //----------------------------------------------------------------- // check /** * Checks the list of elementary predications in a conj op * for well-formedness, or does nothing if the LF is not a conj op. * A UnifyFailure exception is thrown if the check fails. * The only current check is that there is no more than one lexical * predication per nominal. * The list of predications is assumed to be already sorted. */ public static void check(LF lf) throws UnifyFailure { if (lf instanceof Op && ((Op)lf).getName().equals(Op.CONJ)) { check(((Op)lf).getArguments()); } } private static void check(List preds) throws UnifyFailure { for (int i = 0; i < preds.size()-1; i++) { LF lf1 = preds.get(i); LF lf2 = preds.get(i+1); if (isLexPred(lf1) && isLexPred(lf2) && getPrincipalNominal(lf1).equals(getPrincipalNominal(lf2))) { throw new UnifyFailure(); } } } } ================================================ FILE: src/opennlp/ccg/hylo/HyloVar.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-4 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. 
// // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import opennlp.ccg.grammar.*; import opennlp.ccg.synsem.*; import opennlp.ccg.unify.*; import org.jdom.*; import gnu.trove.*; /** * A class for objects which can stand for any HyloFormula object. * Types are unified with other hylo vars, and with other hylo formulas when present. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.17 $, $Date: 2009/07/17 04:23:30 $ **/ public class HyloVar extends HyloFormula implements Variable, Indexed { private static final long serialVersionUID = 3455577234911944031L; protected final String _name; protected int _index; protected int _hashCode; protected SimpleType type; public HyloVar(String name) { this(name, 0, null); } public HyloVar(String name, SimpleType st) { this(name, 0, st); } protected HyloVar(String name, int index, SimpleType st) { _name = name; _index = index; type = (st != null) ? st : Grammar.theGrammar.types.getSimpleType(Types.TOP_TYPE); _hashCode = _name.hashCode() + _index + type.getIndex(); } public String name() { return _name; } public LF copy() { return new HyloVar(_name, _index, type); } public int getIndex() { return _index; } public void setIndex(int index) { _hashCode += index - _index; _index = index; } public SimpleType getType() { return type; } public boolean occurs(Variable var) { return equals(var); } public boolean equals(Object o) { if (this == o) return true; if (!(o instanceof HyloVar)) return false; HyloVar var = (HyloVar) o; return _index == var._index && _name.equals(var._name) && type.equals(var.type); } public int compareTo(HyloVar hv) { int retval = _name.compareTo(hv._name); if (retval == 0) { if (_index < hv._index) { retval = -1; } else if (_index > hv._index) { retval = 1; } } return retval; } public Object unify(Object u, Substitution sub) throws UnifyFailure { // with nominal vars, reverse direction of unification if (u instanceof NominalVar) return ((NominalVar)u).unify(this, sub); // check for equality with u if (equals(u)) return this; // make sure u is an LF if (!(u instanceof LF)) throw new UnifyFailure(); LF lf = (LF) u; // check type compatibility, if present SimpleType st = null; if (lf.getType() != null) st = (SimpleType) type.unify(lf.getType(), sub); // with hylo vars, substitute according to type specificity then comparison order, // so that the direction of unification doesn't matter if (u instanceof HyloVar) { HyloVar u_hv = (HyloVar)u; // equal types, use comparison order if (type.equals(u_hv.getType())) { if (compareTo(u_hv) >= 0) return sub.makeSubstitution(this, u_hv); else return sub.makeSubstitution(u_hv, this); } // unequal types, use most specific one if (type.equals(st)) return sub.makeSubstitution(u_hv, this); if (u_hv.getType().equals(st)) return sub.makeSubstitution(this, u_hv); // otherwise make new hylo var with intersection type, // name based on comparison order and index, and new index String name = (compareTo(u_hv) >= 0) ? 
(u_hv._name + u_hv._index) : (_name + this._index); HyloVar hv_st = new HyloVar(name, UnifyControl.getUniqueVarIndex(), st); // and subst both sub.makeSubstitution(u_hv, hv_st); return sub.makeSubstitution(this, hv_st); } // with props, check for more specific type if (u instanceof Proposition) { Proposition prop = (Proposition) u; // if no or same type, just subst if (st == null || prop.getType().equals(st)) return sub.makeSubstitution(this, prop); // otherwise subst prop with name of type Proposition prop_st = new Proposition(st.getName(), st); return sub.makeSubstitution(this, prop_st); } // otherwise, do occurs check ... if (((LF)u).occurs(this)) throw new UnifyFailure(); // and then go ahead and substitute return sub.makeSubstitution(this, u); } public Object fill(Substitution sub) throws UnifyFailure { Object val = sub.getValue(this); if (val != null) { return val; } else { return this; } } public String toString() { String retval = _name+"_"+_index; if (!type.getName().equals(Types.TOP_TYPE)) retval += ":" + type.getName(); return retval; } /** Returns the name with the type separated by a colon if the type is not the top type. */ public String nameWithType() { String retval = _name; if (!type.getName().equals(Types.TOP_TYPE)) retval += ":" + type.getName(); return retval; } /** * Returns a pretty-printed string of this LF, with the given indent. */ public String prettyPrint(String indent) { return toString(); } /** Returns a hash code based on the name, index and type. */ public int hashCode() { return _hashCode; } /** * Returns a hash code using the given map from vars to ints. */ public int hashCode(TObjectIntHashMap varMap) { // see if this already in map if (varMap.containsKey(this)) return varMap.get(this); // otherwise add it int next = varMap.size() + 1; varMap.put(this, next); return next; } /** * Returns whether this var equals the given object up to variable names, * using the given maps from vars to ints. * (Note that the name and index may differ, but the types must be equal.) */ public boolean equals(Object obj, TObjectIntHashMap varMap, TObjectIntHashMap varMap2) { if (obj.getClass() != this.getClass()) { return false; } HyloVar hv = (HyloVar) obj; if (varMap.get(this) != varMap2.get(hv)) return false; if (!this.type.equals(hv.type)) return false; return true; } /** * Returns an XML representation of this LF. */ public Element toXml() { Element retval = new Element("var"); retval.setAttribute("name", nameWithType()); return retval; } } ================================================ FILE: src/opennlp/ccg/hylo/LexDepFeatureExtractor.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2011-3 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import java.util.*; import opennlp.ccg.lexicon.Word; import opennlp.ccg.perceptron.*; import opennlp.ccg.synsem.*; import opennlp.ccg.util.TrieMap; /** * A class for extracting lexical dependency features. This class * implements the features in White and Rajkumar's EMNLP-12 paper * * Minimal Dependency Length in Realization Ranking. * * Features are extracted lazily for efficiency, using a prefix of "ld" * for "lexical dependency". * * Features potentially involve the word, POS tag, word class, definiteness, syntactic * complexity, short-long order, and total dependency length, where the latter * three can be controlled by the appropriate include* flags; of * these, only dependency length is included by default. * * Word class is based on the semantic class, a check for color terms, common suffixes, * and the presence of a hyphen or capitalization. * * The checks for definite NPs, color terms and common suffixes are done by methods with * defaults for the English CCGbank, which can be overridden in subclasses or * reconfigured in the case of color terms and suffixes. * * @author Michael White * @version $Revision: 1.4 $, $Date: 2011/11/10 15:12:53 $ */ public class LexDepFeatureExtractor implements FeatureExtractor { /** Feature prefix constant: "ld". */ public static final String PREFIX = "ld"; /** Head precedes dep constant: "hpd". */ public static final String HEAD_PRECEDES_DEP = "hpd"; /** Dep precedes head constant: "dph". */ public static final String DEP_PRECEDES_HEAD = "dph"; /** Left of head sibs precedence constant: "lsp". */ public static final String LEFT_SIBS_PRECEDENCE = "lsp"; /** Right of head sibs precedence constant: "rsp". */ public static final String RIGHT_SIBS_PRECEDENCE = "rsp"; /** Returns the appropriate siblings precedence constant for the head-dep order constant. */ public static String sibPrecedenceForDep(String depConst) { return (depConst == DEP_PRECEDES_HEAD) ? LEFT_SIBS_PRECEDENCE : RIGHT_SIBS_PRECEDENCE; } /** Definiteness constant: "def1". */ public static final String DEF = "def1"; /** Indefiniteness constant: "def0". */ public static final String INDEF = "def0"; /** Class constant PRO. */ public static final String CLASS_PRO = "PRO"; /** Class constant COLOR. */ public static final String CLASS_COLOR = "COLOR"; /** Class constant HYPH. */ public static final String CLASS_HYPH = "HYPH"; /** Class constant CAP. */ public static final String CLASS_CAP = "CAP"; /** Class constant NIL. */ public static final String CLASS_NIL = "NIL"; /** Flag for whether to include syntactic complexity ordering features (defaults to false). */ public boolean includeComplexityFeats = false; /** Complexity ordering constant for verb presence: "1v". */ public static final String HAS_V = "1v"; /** Complexity ordering constant for verb presence: "0v". */ public static final String NO_V = "0v"; /** Complexity ordering constant for punct presence: "1p". */ public static final String HAS_P = "1p"; /** Complexity ordering constant for punct absence: "0p". */ public static final String NO_P = "0p"; /** Flag for whether to include short-long features (defaults to false). */ public boolean includeShortLong = false; /** Short-long order constant: "sl". */ public static final String SHORT_LONG_ORDER = "sl"; /** Long-short order constant: "ls". */ public static final String LONG_SHORT_ORDER = "ls"; /** Flag for whether to include global dependency length features (defaults to true). 
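 * When this flag is set, each newly filled dependency contributes its length, as computed by
 * depLen() below (the number of intervening non-punctuation words), to the single "$deplen"
 * feature; for instance, a head at word index 2 and a dependent at index 6 separated by a
 * comma and two other words contributes 2.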
*/ public boolean includeDepLen = true; /** Global dependency length feature constant: "$deplen". */ public static final String DEPLEN = "$deplen"; /** Conditional lazy extractor, for lazily extracting a feature subject to a test. */ public static abstract class ConditionalLazyExtractor { abstract boolean test(); List> lazyExtractor = new ArrayList>(5); } /** Conditional lazy evaluator, for lazily extracting a feature and its value, subject to a test. */ public static abstract class ConditionalLazyEvaluator extends ConditionalLazyExtractor { abstract float eval(); } /** Feature map wrapper, for unique retrieval from a sign's data objects. */ public static class FeatureMapWrapper { public FeatureMap featureMap; public FeatureMapWrapper(FeatureMap featureMap) { this.featureMap = featureMap; } } /** The alphabet. */ protected Alphabet alphabet = null; /** Current feature map. */ protected FeatureMap currentMap = null; /** Current sign (for extracting features). */ protected Sign currentSign = null; /** Current input signs (for extracting features). */ protected Sign[] currentInputs = null; /** Current dependency (for extracting features). */ protected LexDependency currentDep = null; /** Current head index. */ protected int currentHeadIndex = -1; /** Current dependent index. */ protected int currentDepIndex = -1; /** Current sibling dependency (for extracting features). */ protected LexDependency currentSib = null; /** Current sibling dependent index. */ protected int currentSibIndex = -1; /** Current head broad POS (for extracting features). */ protected String currentHeadBroadPOS = null; /** Current head-dependent order (for extracting features). */ protected String currentHeadDepOrder = null; /** Current siblings precedence relation (for extracting features). */ protected String currentSibsPrecedence = null; /** Current dep prececes sib flag (for extracting features). */ protected boolean currentDepPrecedesSib = false; /** Current dep sign (for extracting features). */ protected Sign currentDepSign = null; /** Current sib sign (for extracting features). */ protected Sign currentSibSign = null; /** Current dep phrase lengths (for extracting features). */ protected PhraseLengths currentDepLengths = null; /** Current sib phrase lengths (for extracting features). */ protected PhraseLengths currentSibLengths = null; /** Current difference in lengths between second and first siblings (for extracting features). */ protected PhraseLengths currentLengthsDiff = null; ///** Lexical feature extractors. */ //protected List>> lexExtractors = new ArrayList>>(); /** Dependency order feature extractors. */ protected List>> depOrderExtractors = new ArrayList>>(); /** Siblings order feature extractors. */ protected List>> sibsOrderExtractors = new ArrayList>>(); /** Siblings order conditional feature extractors. */ protected List sibsOrderCondExtractors = new ArrayList(); /** Siblings complexity order conditional feature extractors. */ protected List sibsComplexityOrderCondExtractors = new ArrayList(); /** Short-long conditional feature evaluators. */ protected List shortLongCondEvaluators = new ArrayList(); /** Global dependency length keys. */ protected List depLenKeys = new ArrayList(1); /** Global dependency length feature. */ protected Alphabet.Feature depLenFeat = null; /** Constructor. 
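 * The constructor just registers the lazy feature extractors and the dependency length key;
 * typical use is then along these lines (a sketch, with the alphabet and sign assumed to come
 * from the perceptron model setup):
 * <pre>{@code
 * LexDepFeatureExtractor extractor = new LexDepFeatureExtractor();
 * extractor.includeShortLong = true;   // optionally enable a non-default feature group
 * extractor.setAlphabet(alphabet);
 * FeatureVector fv = extractor.extractFeatures(sign, true);
 * }</pre>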
*/ public LexDepFeatureExtractor() { // init lazy feature extractors depOrderExtractors.add(head_dep_order_words()); depOrderExtractors.add(head_dep_order_pos()); depOrderExtractors.add(head_dep_order_word_pos()); depOrderExtractors.add(head_dep_order_pos_word()); sibsOrderExtractors.add(sibs_precedence_words()); sibsOrderExtractors.add(sibs_precedence_word_pos()); sibsOrderExtractors.add(sibs_precedence_pos_word()); sibsOrderCondExtractors.add(sibs_precedence_pos()); sibsOrderExtractors.add(sibs_precedence_word_class()); sibsOrderExtractors.add(sibs_precedence_class_word()); sibsOrderCondExtractors.add(sibs_precedence_class()); sibsOrderCondExtractors.add(sibs_precedence_rels()); sibsOrderCondExtractors.add(sibs_precedence_defs()); // init complexity feature extractors sibsComplexityOrderCondExtractors.add(sibs_precedence_verbs()); sibsComplexityOrderCondExtractors.add(sibs_precedence_puncts()); // init short-long feature evaluators shortLongCondEvaluators.add(short_long_words()); // init dep len keys depLenKeys.add(DEPLEN); } /** Sets the alphabet. */ public void setAlphabet(Alphabet alphabet) { this.alphabet = alphabet; } /** Returns the features for the given sign and completeness flag. */ public FeatureVector extractFeatures(Sign sign, boolean complete) { addFeatures(sign, complete); return getFeatureMap(sign); } /** Recursively adds features to the feature map for the given sign, if not already present. */ protected void addFeatures(Sign sign, boolean complete) { // check for existing map, otherwise make one if (getFeatureMap(sign) != null) return; // lex case if (sign.isLexical()) { currentSign = sign; currentMap = new FeatureMap(0); //inc(lexExtractors); } // non-terminal else { Sign[] inputs = sign.getDerivationHistory().getInputs(); // first recurse for (Sign child : inputs) addFeatures(child, false); // use input maps in making current map currentSign = sign; currentInputs = inputs; if (inputs.length == 1) { currentMap = new FeatureMap(getFeatureMap(inputs[0])); } else if (inputs.length == 2) { currentMap = new FeatureMap(getFeatureMap(inputs[0]), getFeatureMap(inputs[1])); } // do each newly filled dep for (LexDependency dep : sign.getFilledDeps()) { currentDep = dep; currentHeadBroadPOS = getHeadBroadPOS(dep); setDepIndexes(dep); currentHeadDepOrder = getHeadDepOrder(); inc(depOrderExtractors); // do dep len if (includeDepLen) { Alphabet.Feature f = getDepLenFeat(); if (f != null) currentMap.add(f, (float)depLen()); } // do order for each sib on the same side of the same head for (LexDependency sib : sign.getSiblingFilledDeps()) { currentSib = sib; if (dep.lexHead != sib.lexHead) continue; setSibIndex(sib); if (currentHeadDepOrder != getHeadSibOrder()) continue; currentSibsPrecedence = sibPrecedenceForDep(currentHeadDepOrder); currentDepPrecedesSib = depPrecedesSib(); inc(sibsOrderExtractors); incCond(sibsOrderCondExtractors); // do complexity, length feats if (includeComplexityFeats || includeShortLong) { setLengthsDiff(); if (currentLengthsDiff != null) { if (includeComplexityFeats) incCond(sibsComplexityOrderCondExtractors); if (includeShortLong) addCond(shortLongCondEvaluators); } } } } } // store it storeFeatureMap(sign); } /** Stores the current feature map as a data object in the given sign. */ protected void storeFeatureMap(Sign sign) { sign.addData(new FeatureMapWrapper(currentMap)); } /** Returns the feature map for this extractor from the given sign (null if none). 
*/ protected FeatureMap getFeatureMap(Sign sign) { FeatureMapWrapper fmw = (FeatureMapWrapper)sign.getData(FeatureMapWrapper.class); return (fmw != null) ? fmw.featureMap : null; } /** * Increments the count of the given features, if relevant. */ protected void inc(List>> extractors) { for (List> lazyExtractor : extractors) { Alphabet.Feature f = alphabet.indexLazy(lazyExtractor); if (f != null) currentMap.inc(f); } } /** * Increments the count of the given conditional features, if relevant. */ protected void incCond(List condExtractors) { for (ConditionalLazyExtractor condExtractor : condExtractors) { if (condExtractor.test()) { Alphabet.Feature f = alphabet.indexLazy(condExtractor.lazyExtractor); if (f != null) currentMap.inc(f); } } } /** * Adds to the values of the given conditional features, if relevant. */ protected void addCond(List condEvaluators) { for (ConditionalLazyEvaluator condEvaluator : condEvaluators) { if (condEvaluator.test()) { Alphabet.Feature f = alphabet.indexLazy(condEvaluator.lazyExtractor); if (f != null) currentMap.add(f, condEvaluator.eval()); } } } //------------------------------------ // utility functions // returns up to the first two chars of the head POS private String getHeadBroadPOS(LexDependency dep) { String pos = dep.lexHead.getPOS(); String retval = pos; if (pos.length() > 2) retval = pos.substring(0, 2).intern(); return retval; } // sets the current head and dep indexes, and the dep sign private void setDepIndexes(LexDependency dep) { currentHeadIndex = currentSign.wordIndex(dep.lexHead); currentDepIndex = currentSign.wordIndex(dep.lexDep); currentDepSign = currentSign.getSignHeadedByDep(dep); } // returns the head-dependent order private String getHeadDepOrder() { return (currentHeadIndex < currentDepIndex) ? HEAD_PRECEDES_DEP : DEP_PRECEDES_HEAD; } // sets the current sib index and the sib sign private void setSibIndex(LexDependency sib) { currentSibIndex = currentSign.wordIndex(sib.lexDep); currentSibSign = currentSign.getSignHeadedByDep(sib); } // returns the head--sibling dependent order private String getHeadSibOrder() { return (currentHeadIndex < currentSibIndex) ? HEAD_PRECEDES_DEP : DEP_PRECEDES_HEAD; } // returns whether the dep precedes the sib private boolean depPrecedesSib() { return currentDepIndex < currentSibIndex; } //------------------------------------ // definiteness functions /** Class for storing whether a sign is or immediately contains a definite NP. */ public static class DefiniteNP { /** Definiteness value; null means not an NP (or NP parent). */ public Boolean def; public DefiniteNP(Boolean def) { this.def = def; } public String toString() { return "defNP: " + def; } } /** Returns the definite NP status for a sign, caching it in the sign. 
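 * A null {@code def} value means the sign neither is nor immediately contains an NP; otherwise
 * defConstant maps the result to the definiteness constant. Sketch:
 * <pre>{@code
 * DefiniteNP defNP = getDefiniteNP(sign);
 * if (defNP.def != null) {
 *     String defFeat = defConstant(defNP);   // "def1" or "def0"
 * }
 * }</pre>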
*/ public DefiniteNP getDefiniteNP(Sign sign) { // check cached DefiniteNP defNP = (DefiniteNP)sign.getData(DefiniteNP.class); if (defNP != null) return defNP; // determine def NP status Boolean def = null; // check for NP Sign npSign = getSignOrChildSignAsNP(sign); if (npSign != null) { // set status to definite by default; check for indef def = Boolean.TRUE; // get sem feats Nominal npNom = npSign.getCategory().getIndexNominal(); List semFeats = HyloHelper.getSemFeatsForHead(npNom, npSign.getCategory().getLF()); // check for nil for (SatOp feat : semFeats) { if (isIndefFeat(feat)) { def = Boolean.FALSE; break; } } // otherwise check deps if (def) { // get all deps List allDeps = new ArrayList(5); allDeps.addAll(npSign.getFilledDeps()); allDeps.addAll(npSign.getSiblingFilledDeps()); // check for a|an|some|any for (LexDependency dep : allDeps) { if (isIndefDep(dep)) { def = Boolean.FALSE; break; } } } } // store result and return defNP = new DefiniteNP(def); sign.addData(defNP); return defNP; } /** * Returns the given sign if it's an NP sign; * otherwise returns the first child sign that's an NP sign; * otherwise returns null. */ protected Sign getSignOrChildSignAsNP(Sign sign) { if (isNP(sign)) return sign; if (sign.isLexical()) return null; Sign[] inputs = sign.getDerivationHistory().getInputs(); for (int i = 0; i < inputs.length; i++) { if (isNP(inputs[i])) return inputs[i]; } return null; } /** * Returns whether the given sign is an NP. * The default implementation tests for a category type of "np". */ protected boolean isNP(Sign sign) { Category cat = sign.getCategory(); if (!(cat instanceof AtomCat)) return false; AtomCat ac = (AtomCat) cat; return (ac.getType().equals("np")); } /** * Returns whether the given semantic features signals indefiniteness. * The default implementation tests for <:det>nil. */ protected boolean isIndefFeat(SatOp feat) { return HyloHelper.getRel(feat).equals("det") && "nil".equals(HyloHelper.getVal(feat)); } /** * Returns whether the given lexical dependency signals indefiniteness. * The default implementation checks for <Det>a|an|any|some. */ protected boolean isIndefDep(LexDependency dep) { if (dep.rel.equalsIgnoreCase("Det")) { String form = dep.lexDep.getWordForm(); if (form=="a" || form=="an" || form=="any" || form=="some") return true; } return false; } /** Returns whether two signs differ in definiteness. */ public boolean defDifference(Sign sign1, Sign sign2) { DefiniteNP defNP1 = getDefiniteNP(sign1); if (defNP1.def == null) return false; DefiniteNP defNP2 = getDefiniteNP(sign2); if (defNP2.def == null) return false; return defNP1.def != defNP2.def; } /** Returns the appropriate definiteness/indefiniteness constant. */ public String defConstant(DefiniteNP defNP) { return (defNP.def) ? DEF : INDEF; } //------------------------------------ // phrase length functions /** * Class for storing length of phrase in words, puncts and (finite) verbs, for unique retrieval from a sign's data objects. */ public static class PhraseLengths { public int wordlen, punctlen, verblen; public PhraseLengths(int wordlen, int punctlen, int verblen) { this.wordlen = wordlen; this.punctlen = punctlen; this.verblen = verblen; } public String toString() { return " wordlen: " + wordlen + " punctlen: " + punctlen + " verblen: " + verblen; } } /** Returns the phrase lengths for a sign, caching them in the sign. 
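 * <p>A sketch of the counts, assuming {@code phraseSign} (placeholder) covers the words
 * "the dog , which slept" with "slept" tagged VBD:
 * <pre>{@code
 * PhraseLengths len = getPhraseLengths(phraseSign);
 * // len.wordlen  == 5  (every word, punctuation included)
 * // len.punctlen == 1  (the comma, per isPunct)
 * // len.verblen  == 1  ("slept", per isVerb's finite-verb POS check)
 * }</pre>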
*/ public PhraseLengths getPhraseLengths(Sign sign) { // check cached PhraseLengths lengths = (PhraseLengths)sign.getData(PhraseLengths.class); if (lengths != null) return lengths; int wordlen = 0, punctlen = 0, verblen = 0; // lex case if (sign.isLexical()) { for (Word w: sign.getWords()) { wordlen++; if (isPunct(w)) punctlen++; if (isVerb(w)) verblen++; } } // non-lex: add child lengths else { Sign[] inputs = sign.getDerivationHistory().getInputs(); for (int i = 0; i < inputs.length; i++) { PhraseLengths lengthsI = getPhraseLengths(inputs[i]); wordlen += lengthsI.wordlen; punctlen += lengthsI.punctlen; verblen += lengthsI.verblen; } } // store result and return lengths = new PhraseLengths(wordlen, punctlen, verblen); sign.addData(lengths); return lengths; } /** * Returns whether a word is a punctuation mark that typically signals sentence-internal complexity. * The default implementation tests for commas, dashes (--), semi-colons and colons. */ protected boolean isPunct(Word word) { // NB: in principle could use POS, but sometimes punctuation marks seem to end up with IN as the POS tag String form = word.getForm(); return (form == "," || form == "--" || form == ";" || form == ":"); } /** * Returns whether a word is a verb that indicates a substantial clause. * The default implementation tests for the finite verb POS tags VBD, VBP and VBZ. */ protected boolean isVerb(Word word) { String pos = word.getPOS(); return (pos == "VBD" || pos == "VBP" || pos == "VBZ"); } /** * Sets the differences in length between the signs headed by the current dep and sib, or null if none; * also sets the current dep and sib lengths. The lengths are set to the lengths of the second sign * minus those of the first sign. */ protected void setLengthsDiff() { // reset currentLengthsDiff = null; currentDepLengths = null; currentSibLengths = null; // ensure both there if (currentDepSign == null || currentSibSign == null) return; // get phrase lengths currentDepLengths = getPhraseLengths(currentDepSign); currentSibLengths = getPhraseLengths(currentSibSign); // get 1st and 2nd phrase lengths PhraseLengths pl1 = (currentDepPrecedesSib) ? currentDepLengths : currentSibLengths; PhraseLengths pl2 = (currentDepPrecedesSib) ? currentSibLengths : currentDepLengths; // set diff to 2nd - 1st currentLengthsDiff = new PhraseLengths(pl2.wordlen-pl1.wordlen, pl2.punctlen-pl1.punctlen, pl2.verblen-pl1.verblen); } //------------------------------------ // dep len functions /** Returns the dep len feature if not already set. */ protected Alphabet.Feature getDepLenFeat() { if (depLenFeat == null) depLenFeat = alphabet.index(depLenKeys); return depLenFeat; } /** * Returns the dependency length between the current head and the current dependent. * The default implementation returns the number of intervening words excluding * punctuation (as determined by isPunct), and doesn't count each word in a collapsed NE separately. */ protected int depLen() { List words = currentSign.getWords(); int min = Math.min(currentHeadIndex, currentDepIndex); int max = Math.max(currentHeadIndex, currentDepIndex); int count = 0; for (int i=min+1; i < max; i++) { Word w = words.get(i); if (!isPunct(w)) count++; } return count; } //------------------------------------ // word class functions /** * Returns a class for the word, or CLASS_NIL if none. 
* The default implementation returns one of the following, in this order: * the semantic class of the word; * CLASS_PRO, if a pronoun; * CLASS_COLOR, if a color word; * the suffix, if getSuffix returns a value; * CLASS_HYPH, if the word is hyphenated; * CLASS_CAP, if capitalized; * or CLASS_NIL, otherwise. * The word class is cached using cachedWordClasses. */ protected String getWordClass(Word word) { String retval = cachedWordClasses.get(word); if (retval != null) return retval; String wClass = word.getSemClass(); if (wClass != null) return updateCachedWordClasses(word, wClass); if (isPro(word)) return updateCachedWordClasses(word, CLASS_PRO); String form = word.getForm(); if (colors.contains(form)) return updateCachedWordClasses(word, CLASS_COLOR); String suffix = getSuffix(form); if (suffix != null) return updateCachedWordClasses(word, suffix); if (form.indexOf('-') >= 0) return updateCachedWordClasses(word, CLASS_HYPH); if (Character.isUpperCase(form.charAt(0))) return updateCachedWordClasses(word, CLASS_CAP); return updateCachedWordClasses(word, CLASS_NIL); } /** * Returns whether a word is a pronoun. * The default implementation returns whether the POS tag starts with "PR". */ protected boolean isPro(Word word) { return word.getPOS().startsWith("PR"); } /** * The set of color words to check for in determining the word class. */ protected Set colors = defaultColors(); /** * Sets the set of color words. */ public void setColorWords(Set colorWords) { colors = colorWords; } /** * Returns the default set of color words: 11 common English colors, with two spellings of gray/grey. */ protected Set defaultColors() { String[] colors = { "black", "blue", "brown", "gray", "grey", "green", "orange", "pink", "purple", "red", "white", "yellow" }; return new HashSet(Arrays.asList(colors)); } /** * A sequence of suffixes to check for in determining the word class, ordered by specificity. */ protected String[] suffixClasses = defaultSuffixClasses(); /** * Returns the default suffix classes: 61 common English suffixes from various lists on the web. */ protected String[] defaultSuffixClasses() { return new String[] { "ancy", "aphy", "arch", "crat", "gram", "less", "logy", "ness", "nomy", "ship", "some", "sque", "tude", "ade", "age", "ant", "aph", "ary", "ast", "ate", "ble", "dom", "ent", "est", "ful", "ian", "ile", "ion", "ing", "ish", "ism", "ist", "ise", "ite", "ium", "ive", "ize", "nce", "oid", "ory", "ose", "ote", "ous", "sig", "ure", "ac", "al", "an", "cy", "ed", "en", "er", "fy", "ic", "le", "ly", "or", "se", "sy", "ty", "y" }; } /** * Sets the suffix classes, which are assumed to be interned. */ public void setSuffixClasses(String[] suffixes) { suffixClasses = suffixes; } /** * Returns a matching suffix class, or null if none. */ protected String getSuffix(String form) { for (int i=0; i < suffixClasses.length; i++) { String suff = suffixClasses[i]; if (form.length() > suff.length() && form.endsWith(suff)) return suff; } return null; } /** * Cache of word classes, using a weak hash map. */ protected WeakHashMap cachedWordClasses = new WeakHashMap(); /** * Updates the cached word classes with the given word and word class, and returns the word class. 
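 * <p>A sketch of the classes that end up cached here, assuming the words below carry no
 * semantic class and the usual Penn Treebank POS tags (all examples hypothetical; the
 * form/POS pairs are shorthand for a {@code Word}):
 * <pre>{@code
 * // getWordClass("they"/PRP)       -> CLASS_PRO    (POS starts with "PR")
 * // getWordClass("purple"/JJ)      -> CLASS_COLOR  (in the color-word set)
 * // getWordClass("happiness"/NN)   -> "ness"       (first matching suffix class)
 * // getWordClass("well-run"/JJ)    -> CLASS_HYPH   (hyphenated, no suffix match)
 * // getWordClass("London"/NNP)     -> CLASS_CAP    (capitalized, nothing else fires)
 * // getWordClass("of"/IN)          -> CLASS_NIL    (no rule fires)
 * }</pre>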
*/ protected String updateCachedWordClasses(Word word, String wordClass) { cachedWordClasses.put(word, wordClass); return wordClass; } //------------------------------------ // shared feature extractor elements // prefix: "ld" + head broad POS private void add_prefix(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return PREFIX; }}); retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return currentHeadBroadPOS; }}); } // head-dep order private void add_head_dep_order(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return currentHeadDepOrder; }}); } // rel private void add_rel(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return currentDep.rel.intern(); }}); } // common head-dep order elements private void add_head_dep_order_common(List> retval) { add_prefix(retval); add_head_dep_order(retval); add_rel(retval); } // head word private void add_head_word(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return currentDep.lexHead.getWordForm(); }}); } // head pos private void add_head_pos(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return currentDep.lexHead.getPOS(); }}); } // dep word private void add_dep_word(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return currentDep.lexDep.getWordForm(); }}); } // dep pos private void add_dep_pos(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return currentDep.lexDep.getPOS(); }}); } // sibs precedence private void add_sibs_precedence(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return currentSibsPrecedence; }}); } // common sibs precedence elements private void add_sibs_precedence_common(List> retval) { add_prefix(retval); add_sibs_precedence(retval); } // sibs word1 private void add_sibs_word1(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return (currentDepPrecedesSib) ? currentDep.lexDep.getWordForm() : currentSib.lexDep.getWordForm(); }}); } // sibs word2 private void add_sibs_word2(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return (currentDepPrecedesSib) ? currentSib.lexDep.getWordForm() : currentDep.lexDep.getWordForm(); }}); } // sibs pos1 private void add_sibs_pos1(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return (currentDepPrecedesSib) ? currentDep.lexDep.getPOS() : currentSib.lexDep.getPOS(); }}); } // sibs pos2 private void add_sibs_pos2(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return (currentDepPrecedesSib) ? currentSib.lexDep.getPOS() : currentDep.lexDep.getPOS(); }}); } // sibs class1 private void add_sibs_class1(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ Sign first = (currentDepPrecedesSib) ? currentDep.lexDep : currentSib.lexDep; return getWordClass(first.getWords().get(0)); }}); } // sibs class2 private void add_sibs_class2(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ Sign second = (currentDepPrecedesSib) ? currentSib.lexDep : currentDep.lexDep; return getWordClass(second.getWords().get(0)); }}); } // sibs rel1 private void add_sibs_rel1(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return (currentDepPrecedesSib) ? 
currentDep.rel.intern() : currentSib.rel.intern(); }}); } // sibs rel2 private void add_sibs_rel2(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return (currentDepPrecedesSib) ? currentSib.rel.intern() : currentDep.rel.intern(); }}); } //------------------------------- // feature extractors // head-dep order words private List> head_dep_order_words() { List> retval = new ArrayList>(5); add_head_dep_order_common(retval); add_head_word(retval); add_dep_word(retval); return retval; } // head-dep order pos private List> head_dep_order_pos() { List> retval = new ArrayList>(5); add_head_dep_order_common(retval); add_head_pos(retval); add_dep_pos(retval); return retval; } // head-dep order word/pos private List> head_dep_order_word_pos() { List> retval = new ArrayList>(5); add_head_dep_order_common(retval); add_head_word(retval); add_dep_pos(retval); return retval; } // head-dep order pos/word private List> head_dep_order_pos_word() { List> retval = new ArrayList>(5); add_head_dep_order_common(retval); add_head_pos(retval); add_dep_word(retval); return retval; } // sibs precedence words private List> sibs_precedence_words() { List> retval = new ArrayList>(5); add_sibs_precedence_common(retval); add_sibs_word1(retval); add_sibs_word2(retval); return retval; } // sibs precedence word pos private List> sibs_precedence_word_pos() { List> retval = new ArrayList>(5); add_sibs_precedence_common(retval); add_sibs_word1(retval); add_sibs_pos2(retval); return retval; } // sibs precedence pos word private List> sibs_precedence_pos_word() { List> retval = new ArrayList>(5); add_sibs_precedence_common(retval); add_sibs_pos1(retval); add_sibs_word2(retval); return retval; } // sibs precedence pos private ConditionalLazyExtractor sibs_precedence_pos() { ConditionalLazyExtractor retval = new ConditionalLazyExtractor() { boolean test() { return currentDep.lexDep.getPOS() != currentSib.lexDep.getPOS(); } }; add_sibs_precedence_common(retval.lazyExtractor); add_sibs_pos1(retval.lazyExtractor); add_sibs_pos2(retval.lazyExtractor); return retval; } // sibs precedence word / class private List> sibs_precedence_word_class() { List> retval = new ArrayList>(5); add_sibs_precedence_common(retval); add_sibs_word1(retval); add_sibs_class2(retval); return retval; } // sibs precedence class / word private List> sibs_precedence_class_word() { List> retval = new ArrayList>(5); add_sibs_precedence_common(retval); add_sibs_class1(retval); add_sibs_word2(retval); return retval; } // sibs precedence class private ConditionalLazyExtractor sibs_precedence_class() { ConditionalLazyExtractor retval = new ConditionalLazyExtractor() { boolean test() { return getWordClass(currentDep.lexDep.getWords().get(0)) != getWordClass(currentSib.lexDep.getWords().get(0)); } }; add_sibs_precedence_common(retval.lazyExtractor); add_sibs_class1(retval.lazyExtractor); add_sibs_class2(retval.lazyExtractor); return retval; } // sibs precedence rels private ConditionalLazyExtractor sibs_precedence_rels() { ConditionalLazyExtractor retval = new ConditionalLazyExtractor() { boolean test() { return !currentDep.rel.equals(currentSib.rel); } }; add_sibs_precedence_common(retval.lazyExtractor); add_sibs_rel1(retval.lazyExtractor); add_sibs_rel2(retval.lazyExtractor); return retval; } // sibs precedence defs private ConditionalLazyExtractor sibs_precedence_defs() { ConditionalLazyExtractor retval = new ConditionalLazyExtractor() { boolean test() { if (currentDepSign == null || currentSibSign == null) return false; return 
defDifference(currentDepSign, currentSibSign); } }; add_sibs_precedence_common(retval.lazyExtractor); retval.lazyExtractor.add(new TrieMap.KeyExtractor(){public String getKey(){ return (currentDepPrecedesSib) ? defConstant(getDefiniteNP(currentDepSign)) : defConstant(getDefiniteNP(currentSibSign)); }}); retval.lazyExtractor.add(new TrieMap.KeyExtractor(){public String getKey(){ return (currentDepPrecedesSib) ? defConstant(getDefiniteNP(currentSibSign)) : defConstant(getDefiniteNP(currentDepSign)); }}); return retval; } // sibs precedence verbs private ConditionalLazyExtractor sibs_precedence_verbs() { ConditionalLazyExtractor retval = new ConditionalLazyExtractor() { boolean test() { return currentLengthsDiff.verblen != 0 && (currentDepLengths.verblen == 0 || currentSibLengths.verblen == 0); } }; add_sibs_precedence_common(retval.lazyExtractor); retval.lazyExtractor.add(new TrieMap.KeyExtractor(){public String getKey(){ return (currentLengthsDiff.verblen > 0) ? NO_V : HAS_V; }}); retval.lazyExtractor.add(new TrieMap.KeyExtractor(){public String getKey(){ return (currentLengthsDiff.verblen > 0) ? HAS_V : NO_V; }}); return retval; } // sibs precedence puncts private ConditionalLazyExtractor sibs_precedence_puncts() { ConditionalLazyExtractor retval = new ConditionalLazyExtractor() { boolean test() { return currentLengthsDiff.punctlen != 0 && (currentDepLengths.punctlen == 0 || currentSibLengths.punctlen == 0); } }; add_sibs_precedence_common(retval.lazyExtractor); retval.lazyExtractor.add(new TrieMap.KeyExtractor(){public String getKey(){ return (currentLengthsDiff.punctlen > 0) ? NO_P : HAS_P; }}); retval.lazyExtractor.add(new TrieMap.KeyExtractor(){public String getKey(){ return (currentLengthsDiff.punctlen > 0) ? HAS_P : NO_P; }}); return retval; } // short-long words private ConditionalLazyEvaluator short_long_words() { ConditionalLazyEvaluator retval = new ConditionalLazyEvaluator() { boolean test() { return currentLengthsDiff.wordlen != 0; } float eval() { return (float) Math.abs(currentLengthsDiff.wordlen); } }; add_sibs_precedence_common(retval.lazyExtractor); retval.lazyExtractor.add(new TrieMap.KeyExtractor(){public String getKey(){ return (currentLengthsDiff.wordlen > 0) ? SHORT_LONG_ORDER : LONG_SHORT_ORDER; }}); return retval; } } ================================================ FILE: src/opennlp/ccg/hylo/LexDependency.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2011 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import java.util.*; import opennlp.ccg.synsem.*; /** * A class for tracking semantic dependencies between lexical items. 
* A lex dependency is a triple consisting of a lexical head, a relation * and a lexical dependent. Either the head or dependent can be null, in * which case the dependency is considered unfilled. To be equal, a lex * dependency must have identical heads and dependents and equal relations. * Relations can involve chains of individual relations (concatenated with dots) * when there are intervening nominals for the same lexical item. * * @author Michael White * @version $Revision: 1.2 $, $Date: 2011/08/26 21:31:52 $ */ public class LexDependency { /** The lexical head. */ public Sign lexHead; /** The relation. */ public String rel; /** The lexical dependent. */ public Sign lexDep; /** Constructor. */ public LexDependency(Sign lexHead, String rel, Sign lexDep) { this.lexHead = lexHead; this.rel = rel; this.lexDep = lexDep; } /** Hash code. */ public int hashCode() { int retval = rel.hashCode(); if (lexHead != null) retval += 31 * lexHead.hashCode(); if (lexDep != null) retval += 7 * lexDep.hashCode(); return retval; } /** Equals. */ public boolean equals(Object obj) { if (obj == this) return true; if (!(obj instanceof LexDependency)) return false; LexDependency dep = (LexDependency) obj; return lexHead == dep.lexHead && lexDep == dep.lexDep && rel.equals(dep.rel); } /** toString. */ public String toString() { StringBuffer retval = new StringBuffer(); if (lexHead == null) retval.append("null"); else retval.append(lexHead.getOrthography()); retval.append('<').append(rel).append('>'); if (lexDep == null) retval.append("null"); else retval.append(lexDep.getOrthography()); return retval.toString(); } /** Filled test: neither head nor dependent null. */ public boolean filled() { return lexHead != null && lexDep != null; } /** * Returns a list of unfilled dependencies for a list of EPs * for a lexical item. 
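 * <p>A sketch of the dependency triples themselves, with {@code eatSign} and {@code pizzaSign}
 * standing in for lexical signs (placeholder names):
 * <pre>{@code
 * LexDependency open   = new LexDependency(eatSign, "Arg1", null);      // dependent still unfilled
 * LexDependency filled = new LexDependency(eatSign, "Arg1", pizzaSign);
 * open.filled();       // false
 * filled.filled();     // true
 * filled.toString();   // e.g. "eat<Arg1>pizza", using each sign's orthography
 * }</pre>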
*/ public static List unfilledLexDeps(List preds) { List retval = new ArrayList(4); Map nomIndex = HyloHelper.nomIndex(preds); Set nominals = nomIndex.keySet(); // special case for indexRels if (nominals.size() == 1 && !HyloHelper.isLexPred(preds.get(0))) { Sign lexHead = null; LexSemOrigin origin = preds.get(0).getOrigin(); if (origin instanceof Sign) lexHead = (Sign) origin; else return retval; for (SatOp pred : preds) { String rel = HyloHelper.getRel(pred); if (rel != null) { // add unfilled dep with lex head as dep retval.add(new LexDependency(null, rel, lexHead)); if (HyloHelper.isRelPred(pred)) { // also add unfilled dep with lex head as head retval.add(new LexDependency(lexHead, rel, null)); } } } return retval; } // otherwise, starting with each root nominal, enumerate paths to leaf nominals for (Nominal root : nominals) { // check for root nominal if (!HyloHelper.isRoot(root, preds)) continue; // set lex head Sign lexHead = null; int rootIndex = nomIndex.get(root); SatOp rootPred = preds.get(rootIndex); if (HyloHelper.isLexPred(rootPred)) { LexSemOrigin origin = rootPred.getOrigin(); if (origin instanceof Sign) lexHead = (Sign) origin; rootIndex++; } // start path for each rel for root nom for (int i=rootIndex; i < preds.size() && HyloHelper.getPrincipalNominal(preds.get(i)).equals(root); i++) { rootPred = preds.get(i); Nominal dep = HyloHelper.getSecondaryNominal(rootPred); if (dep == null) continue; String rel = HyloHelper.getRel(rootPred); addUnfilledLexDep(dep, lexHead, rel, preds, nomIndex, retval); } } return retval; } // recursively adds unfilled lex deps to retval for leaf nominals private static void addUnfilledLexDep(Nominal dep, Sign lexHead, String rel, List preds, Map nomIndex, List retval) { // if dep not in nom index, then just add unfilled dep for the current rel if (!nomIndex.containsKey(dep)) { retval.add(new LexDependency(lexHead, rel, null)); return; } // otherwise continue with the preds for the current dep int depIndex = nomIndex.get(dep); SatOp depPred = preds.get(depIndex); // if lex head null, add unfilled dep for the current rel, // then update lex head and reset rel if (lexHead == null) { Sign lexDep = null; LexSemOrigin origin = depPred.getOrigin(); if (origin instanceof Sign) { lexDep = (Sign) origin; retval.add(new LexDependency(lexHead, rel, lexDep)); } lexHead = lexDep; rel = null; } // then recurse through further rels, if any for (int i=depIndex; i < preds.size() && HyloHelper.getPrincipalNominal(preds.get(i)).equals(dep); i++) { depPred = preds.get(i); Nominal depdep = HyloHelper.getSecondaryNominal(depPred); if (depdep == null) continue; String relrel = (rel == null) ? HyloHelper.getRel(depPred) : rel + "." + HyloHelper.getRel(depPred); addUnfilledLexDep(depdep, lexHead, relrel, preds, nomIndex, retval); } } /** * Returns the filled lexical dependencies from those in the unfilled list * by checking the list of EPs for ones that have become filled, removing the * corresponding no longer unfilled deps. 
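 * <p>A sketch of the intended calling pattern, assuming {@code unfilled} was obtained from
 * {@code unfilledLexDeps} on a lexical sign and {@code preds} is the combined EP list after
 * a derivation step (both placeholders):
 * <pre>{@code
 * List<LexDependency> nowFilled = LexDependency.filledLexDeps(unfilled, preds);
 * // deps that became filled are returned here and are also removed from 'unfilled' in place
 * }</pre>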
*/ public static List filledLexDeps(List unfilled, List preds) { List retval = new ArrayList(unfilled.size()); Map nomIndex = HyloHelper.nomIndex(preds); // check each unfilled dep for (Iterator it = unfilled.iterator(); it.hasNext(); ) { LexDependency udep = it.next(); String[] rels = udep.rel.split("\\."); // dependent missing case if (udep.lexDep == null) { // follow rels to descendant pred SatOp relPred = findPred(udep.lexHead, rels[0], preds); SatOp descendantPred = findDescendantPred(relPred, 0, rels, preds, nomIndex); // check if dep filled Nominal depnom = HyloHelper.getSecondaryNominal(descendantPred); if (!nomIndex.containsKey(depnom)) continue; SatOp depPred = preds.get(nomIndex.get(depnom)); if (HyloHelper.isLexPred(depPred)) { // remove dep from unfilled it.remove(); // add filled dep, if lexical if (depPred.getOrigin() instanceof Sign) { Sign lexDep = (Sign) depPred.getOrigin(); retval.add(new LexDependency(udep.lexHead, udep.rel, lexDep)); } } } // head missing case else if (udep.lexHead == null) { // follow rels to ancestor pred SatOp relPred = findPred(udep.lexDep, rels[rels.length-1], preds); SatOp ancestorPred = findAncestorPred(relPred, rels.length-1, rels, preds); // check if head filled Nominal headnom = HyloHelper.getPrincipalNominal(ancestorPred); if (!nomIndex.containsKey(headnom)) continue; SatOp headPred = preds.get(nomIndex.get(headnom)); if (HyloHelper.isLexPred(headPred)) { // remove dep from unfilled it.remove(); // add filled dep, if lexical if (headPred.getOrigin() instanceof Sign) { Sign lexHead = (Sign) headPred.getOrigin(); retval.add(new LexDependency(lexHead, udep.rel, udep.lexDep)); } } } } return retval; } // returns the EP with the given origin and rel, or null if not found private static SatOp findPred(Sign origin, String rel, List preds) { for (SatOp pred : preds) { if (pred.getOrigin() != origin) continue; if (rel.equals(HyloHelper.getRel(pred))) return pred; } return null; } // returns the descendant EP for the given rels, or null if not found private static SatOp findDescendantPred(SatOp current, int index, String[] rels, List preds, Map nomIndex) { if (index == rels.length-1) return current; // find EP for next rel SatOp next = null; String rel = rels[++index]; Nominal depnom = HyloHelper.getSecondaryNominal(current); for (int i=nomIndex.get(depnom); i < preds.size() && HyloHelper.getPrincipalNominal(preds.get(i)).equals(depnom); i++) { SatOp pred = preds.get(i); if (rel.equals(HyloHelper.getRel(pred))) { next = pred; break; } } if (next == null) return null; // recurse return findDescendantPred(next, index, rels, preds, nomIndex); } // returns the ancestor EP for the given rels, or null if not found private static SatOp findAncestorPred(SatOp current, int index, String[] rels, List preds) { if (index == 0) return current; // find EP for previous rel SatOp prev = null; String rel = rels[--index]; Nominal headnom = HyloHelper.getPrincipalNominal(current); for (int i=0; i < preds.size(); i++) { SatOp pred = preds.get(i); if (headnom.equals(HyloHelper.getSecondaryNominal(pred)) && rel.equals(HyloHelper.getRel(pred))) { prev = pred; break; } } if (prev == null) return null; // recurse return findAncestorPred(prev, index, rels, preds); } /** * Filters the first list of dependencies to those sharing a head with a dependency in the second list. 
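 * <p>A sketch, with {@code newDeps} and {@code siblingDeps} as placeholder lists; note that
 * heads are compared by object identity (the same {@code Sign} instance), not by equals:
 * <pre>{@code
 * List<LexDependency> shared = LexDependency.filterSameHead(newDeps, siblingDeps);
 * // a dep from newDeps is kept iff some dep in siblingDeps has the very same lexHead sign
 * }</pre>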
*/ public static List filterSameHead(List deps1, List deps2) { if (deps1.isEmpty() || deps2.isEmpty()) return Collections.emptyList(); List retval = new ArrayList(deps1.size()); for (LexDependency dep1 : deps1) { for (LexDependency dep2 : deps2) { if (dep1.lexHead == dep2.lexHead) { retval.add(dep1); break; } } } return retval; } } ================================================ FILE: src/opennlp/ccg/hylo/ModalOp.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import opennlp.ccg.synsem.*; import opennlp.ccg.unify.*; import org.jdom.*; import java.util.*; import gnu.trove.*; /** * A parent class for modal operators, such as <P>p, [F]q, and * <>(p ^ q). * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.6 $, $Date: 2009/12/21 03:27:19 $ **/ public abstract class ModalOp extends HyloFormula { private static final long serialVersionUID = 1L; protected Mode _mode; protected LF _arg; @SuppressWarnings("unchecked") protected ModalOp(Element e) { String atomLabel = e.getAttributeValue("mode"); if (atomLabel == null) atomLabel = e.getAttributeValue("m"); if (atomLabel != null) { _mode = new ModeLabel(atomLabel); _arg = HyloHelper.getLF_FromChildren(e); } else { List children = e.getChildren(); _mode = (Mode)HyloHelper.getLF((Element)children.get(0)); _arg = HyloHelper.getLF((Element)children.get(1)); } } protected ModalOp(Mode mode, LF arg) { _mode = mode; _arg = arg; } public Mode getMode() { return _mode; } public void setMode(Mode mode) { _mode = mode; } public LF getArg() { return _arg; } public void setArg(LF arg) { _arg = arg; } public void deepMap(ModFcn mf) { _arg.deepMap(mf); mf.modify(this); } public boolean occurs(Variable var) { return _mode.occurs(var) || _arg.occurs(var); } protected boolean equals(ModalOp mo) { if (_mode.equals(mo._mode) && _arg.equals(mo._arg)) { return true; } else { return false; } } protected void unifyCheck(ModalOp mo) throws UnifyFailure { _mode.unifyCheck(mo._mode); _arg.unifyCheck(mo._arg); } /** Returns a hash code based on the mode and arg. */ public int hashCode() { return _mode.hashCode() + _arg.hashCode(); } /** * Returns a hash code using the given map from vars to ints. */ public int hashCode(TObjectIntHashMap varMap) { return _mode.hashCode(varMap) + _arg.hashCode(varMap); } /** * Returns whether this modal op equals the given object * up to variable names, using the given maps from vars to ints. 
*/ public boolean equals(Object obj, TObjectIntHashMap varMap, TObjectIntHashMap varMap2) { if (obj.getClass() != this.getClass()) { return false; } ModalOp mo = (ModalOp) obj; return _mode.equals(mo._mode, varMap, varMap2) && _arg.equals(mo._arg, varMap, varMap2); } /** Returns the string form of this modal op, without the arg. */ abstract public String modalOpString(); public String toString() { return new StringBuffer().append(modalOpString()).append(_arg.toString()).toString(); } /** * Returns a pretty-printed string of this LF, with the given indent. */ public String prettyPrint(String indent) { // calc new indent StringBuffer ibuf = new StringBuffer(); ibuf.append(indent).append(' '); String modalOpString = modalOpString(); for (int i = 0; i < modalOpString.length(); i++) { ibuf.append(' '); } String newIndent = ibuf.toString(); // calc string StringBuffer sb = new StringBuffer(); sb.append('\n').append(indent).append(modalOpString); sb.append(_arg.prettyPrint(newIndent)); // done return sb.toString(); } } ================================================ FILE: src/opennlp/ccg/hylo/Mode.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002 Jason Baldridge // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import opennlp.ccg.synsem.*; /** * A interface for hybrid logic nominals, to allow polymorphism for * both Modality labels and variables over Modality labels. * * @author Jason Baldridge * @author Scott Martin * @version $Revision: 1.2 $, $Date: 2005/10/19 21:27:15 $ **/ public interface Mode extends LF { /** * Gets the name of this mode. */ String getName(); } ================================================ FILE: src/opennlp/ccg/hylo/ModeLabel.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-4 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import opennlp.ccg.synsem.*; import opennlp.ccg.unify.*; import org.jdom.*; /** * A modality label. * Types are not currently supported. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.5 $, $Date: 2009/07/17 04:23:30 $ **/ public final class ModeLabel extends HyloAtom implements Mode { private static final long serialVersionUID = -4101305505903588678L; public ModeLabel(String name) { super(name); } public LF copy() { return new ModeLabel(_name); } public Object unify(Object u, Substitution sub) throws UnifyFailure { if (equals(u)) return this; return super.unify(u, sub); } /** * Returns an XML representation of this LF (not currently supported). * Throws a runtime exception. */ public Element toXml() { throw new RuntimeException("toXml() not currently supported for ModeLabel."); } } ================================================ FILE: src/opennlp/ccg/hylo/ModeVar.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-4 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import opennlp.ccg.synsem.*; import opennlp.ccg.unify.*; import org.jdom.*; /** * A class for variables over ModeLabel objects. * Mode vars are not really supported at present, and * type unification is not implemented. * * @author Jason Baldridge * @author Scott Martin * @version $Revision: 1.5 $, $Date: 2009/07/17 04:23:30 $ **/ public class ModeVar extends HyloVar implements Mode { private static final long serialVersionUID = -6872985893931836901L; public ModeVar(String name) { super(name); } protected ModeVar(String name, int index, SimpleType st) { super(name, index, st); } /** * Gets the name of this mode variable. * @return This method just delegates to the {@link #name()} method. 
*/ @Override public String getName() { return name(); } public LF copy() { return new ModeVar(_name, _index, type); } public boolean equals(Object o) { if (!(o instanceof ModeVar)) return false; return super.equals(o); } public Object unify(Object u, Substitution sub) throws UnifyFailure { if (u instanceof ModeLabel) { return sub.makeSubstitution(this, u); } else if (u instanceof ModeVar) { ModeVar u_nv = (ModeVar)u; if (equals(u_nv)) return this; // substitute according to comparison order, // so that the direction of unification doesn't matter if (compareTo(u_nv) >= 0) { return sub.makeSubstitution(this, u_nv); } else { return sub.makeSubstitution(u_nv, this); } } else { throw new UnifyFailure(); } } public Object fill(Substitution sub) throws UnifyFailure { Object val = sub.getValue(this); if (val != null) { return val; } else { return this; } } /** * Returns an XML representation of this LF (not currently supported). * Throws a runtime exception. */ public Element toXml() { throw new RuntimeException("toXml() not currently supported for ModeVar."); } } ================================================ FILE: src/opennlp/ccg/hylo/Nominal.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-3 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import opennlp.ccg.synsem.*; /** * A interface for hybrid logic nominals, to allow polymorphism for * both Nominal atoms and Nominal variables. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.6 $, $Date: 2005/11/01 19:39:27 $ **/ public interface Nominal extends LF { public String getName(); public boolean isShared(); public void setShared(boolean shared); public int compareTo(Nominal nom); } ================================================ FILE: src/opennlp/ccg/hylo/NominalAtom.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-4 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. 
// // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import java.io.FileInputStream; import java.io.FileOutputStream; import java.io.IOException; import java.io.ObjectInputStream; import java.io.ObjectOutputStream; import opennlp.ccg.grammar.*; import opennlp.ccg.synsem.*; import opennlp.ccg.unify.*; import org.jdom.*; /** * A hybrid logic nominal, an atomic formula which holds true at exactly one * point in a model. * The type is checked for compatibility during unification with nominal vars, * but it is not updated, since nominal atoms are constants. * If no type is given, the TOP type is used for backwards compatibility. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.10 $, $Date: 2009/07/17 04:23:30 $ **/ public class NominalAtom extends HyloAtom implements Nominal { private static final long serialVersionUID = -6002484920078196411L; protected boolean shared = false; public NominalAtom(String name) { this(name, null); } public NominalAtom(String name, SimpleType st) { this(name, st, false); } public NominalAtom(String name, SimpleType st, boolean shared) { super(name, st); type = (st != null) ? st : Grammar.theGrammar.types.getSimpleType(Types.TOP_TYPE); this.shared = shared; } public String getName() { return _name; } public boolean isShared() { return shared; } public void setShared(boolean shared) { this.shared = shared; } public LF copy() { return new NominalAtom(_name, type, shared); } /** Returns a hash code based on the atom name and type. */ public int hashCode() { return _name.hashCode() + type.hashCode(); } /** * Returns whether this atom equals the given object based on the atom name and type. */ public boolean equals(Object obj) { if (!super.equals(obj)) return false; NominalAtom nom = (NominalAtom) obj; return type.equals(nom.type); } public Object unify(Object u, Substitution sub) throws UnifyFailure { if (equals(u)) return this; return super.unify(u, sub); } public int compareTo(Nominal nom) { if (nom instanceof NominalAtom) { return super.compareTo((NominalAtom)nom); } int retval = _name.compareTo(nom.getName()); if (retval == 0) { retval = -1; } // atom precedes var if names equal return retval; } public String toString() { String retval = _name; if (!type.getName().equals(Types.TOP_TYPE)) retval += ":" + type.getName(); return retval; } /** * Returns an XML representation of this LF. */ public Element toXml() { Element retval = new Element("nom"); retval.setAttribute("name", toString()); return retval; } /** Tests serialization. 
*/ public static void debugSerialization() throws IOException, ClassNotFoundException { // test serialization NominalAtom n = new NominalAtom("w1"); String filename = "tmp.ser"; ObjectOutputStream out = new ObjectOutputStream(new FileOutputStream(filename)); System.out.println("Writing n: " + n); out.writeObject(n); out.close(); ObjectInputStream in = new ObjectInputStream(new FileInputStream(filename)); System.out.print("Reading n2: "); NominalAtom n2 = (NominalAtom) in.readObject(); System.out.println(n2); in.close(); // test identity and equality System.out.println("n == n2?: " + (n == n2)); System.out.println("n.equals(n2)?: " + (n.equals(n2))); } } ================================================ FILE: src/opennlp/ccg/hylo/NominalVar.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-4 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import opennlp.ccg.synsem.*; import opennlp.ccg.unify.*; import org.jdom.*; /** * A class for variables over NominalAtom objects. * Nominal vars take precedence over generic hylo vars. * Types are unified with other hylo vars and nominal atoms. 
* * @author Jason Baldridge * @author Michael White * @version $Revision: 1.13 $, $Date: 2009/07/17 04:23:30 $ **/ public class NominalVar extends HyloVar implements Nominal { private static final long serialVersionUID = -2086362887254623273L; protected boolean shared = false; public NominalVar(String name) { super(name); } public NominalVar(String name, SimpleType st) { super(name, st); } public NominalVar(String name, SimpleType st, boolean shared) { super(name, st); this.shared = shared; } protected NominalVar(String name, int index, SimpleType st) { super(name, index, st); } protected NominalVar(String name, int index, SimpleType st, boolean shared) { super(name, index, st); this.shared = shared; } public String getName() { return _name; } public boolean isShared() { return shared; } public void setShared(boolean shared) { this.shared = shared; } public void setType(SimpleType st) { _hashCode += st.getIndex() - type.getIndex(); type = st; } public LF copy() { return new NominalVar(_name, _index, type, shared); } public boolean equals(Object o) { if (!(o instanceof NominalVar)) return false; return super.equals(o); } public int compareTo(Nominal nom) { if (nom instanceof NominalVar) { return super.compareTo((NominalVar)nom); } int retval = _name.compareTo(nom.getName()); if (retval == 0) { retval = 1; } // atom precedes var if names equal return retval; } public Object unify(Object u, Substitution sub) throws UnifyFailure { // check for equality with u if (equals(u)) return this; // make sure u is an LF if (!(u instanceof LF)) throw new UnifyFailure(); // check type compatibility LF lf = (LF) u; if (lf.getType() == null) throw new UnifyFailure(); SimpleType st = (SimpleType) type.unify(lf.getType(), sub); // with nominal atoms, go ahead and substitute if (u instanceof NominalAtom) return sub.makeSubstitution(this, u); // with nominal vars, substitute according to type specificity then comparison order, // so that the direction of unification doesn't matter if (u instanceof NominalVar) { NominalVar u_nv = (NominalVar) u; // equal types, use comparison order if (type.equals(u_nv.getType())) { if (super.compareTo(u_nv) >= 0) return sub.makeSubstitution(this, u_nv); else return sub.makeSubstitution(u_nv, this); } // unequal types, use most specific one if (type.equals(st)) return sub.makeSubstitution(u_nv, this); if (u_nv.getType().equals(st)) return sub.makeSubstitution(this, u_nv); // otherwise make new nom var with intersection type, // name based on comparison order and index, and new index String name = (super.compareTo(u_nv) >= 0) ? (u_nv._name + u_nv._index) : (_name + _index); NominalVar nv_st = new NominalVar(name, UnifyControl.getUniqueVarIndex(), st); // and subst both sub.makeSubstitution(u_nv, nv_st); return sub.makeSubstitution(this, nv_st); } // with hylo vars, substitute the hylo var for this if (u instanceof HyloVar) { HyloVar u_hv = (HyloVar) u; // check for same type if (type.equals(st)) return sub.makeSubstitution(u_hv, this); // otherwise make new nom var with intersection type, // same name, and new index NominalVar nv_st = new NominalVar(this._name, UnifyControl.getUniqueVarIndex(), st); // and subst both sub.makeSubstitution(u_hv, nv_st); return sub.makeSubstitution(this, nv_st); } // otherwise give up throw new UnifyFailure(); } public Object fill(Substitution sub) throws UnifyFailure { Object val = sub.getValue(this); if (val != null) { return val; } else { return this; } } /** * Returns an XML representation of this LF. 
*/ public Element toXml() { Element retval = new Element("nomvar"); retval.setAttribute("name", nameWithType()); return retval; } } ================================================ FILE: src/opennlp/ccg/hylo/Op.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-5 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import opennlp.ccg.synsem.*; import opennlp.ccg.unify.*; import opennlp.ccg.grammar.Grammar; import org.jdom.*; import java.util.*; import gnu.trove.*; /** * A generic operator, such as conjunction, disjunction, exclusive-or, * negation or optionality (^, v, v_, ~, ?). * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.17 $, $Date: 2009/12/21 03:27:19 $ **/ public class Op extends HyloFormula { private static final long serialVersionUID = -7489598953770901195L; /** Conjunction constant. */ public static final String CONJ = "conj"; /** Disjunction constant. */ public static final String DISJ = "disj"; /** Exclusive-or constant. */ public static final String XOR = "xor"; /** Negation constant. */ public static final String NEG = "neg"; /** Optionality constant. */ public static final String OPT = "opt"; /** The name of the operator (ie its kind). */ protected final String _name; /** The args. */ protected List _args; /** Element constructor. */ @SuppressWarnings("unchecked") public Op(Element e) { String name = e.getAttributeValue("name"); if (name == null) name = e.getAttributeValue("n"); _name = name; List argElements = e.getChildren(); int argSize = argElements.size(); List args = new ArrayList(argSize); for (int i=0; i 1 && (name.equals(NEG) || name.equals(OPT))) { _args = new ArrayList(1); _args.add(new Op(CONJ, args)); } else _args = args; } /** Constructor. */ public Op(String name, List args) { _name = name; _args = args; } /** Two arg convenience constructor. */ public Op(String name, LF first, LF second) { _name = name; _args = new ArrayList(); _args.add(first); _args.add(second); } public String getName() { return _name; } public List getArguments() { return _args; } public void addArgument(LF formula) { _args.add(formula); } /** * Appends the args if the given lf is a CONJ op, * otherwise just adds it. 
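 * <p>A sketch of building and flattening a conjunction, assuming {@code p}, {@code q},
 * {@code r}, {@code s} and {@code t} are existing LFs (placeholder names):
 * <pre>{@code
 * Op conj = new Op(Op.CONJ, p, q);          // printed roughly as "(p ^ q)"
 * conj.appendArgs(new Op(Op.CONJ, r, s));   // CONJ arg is flattened: args become p, q, r, s
 * conj.appendArgs(t);                       // a non-CONJ LF is simply appended
 * }</pre>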
*/ public void appendArgs(LF lf) { if (lf instanceof Op && ((Op)lf).getName().equals(Op.CONJ)) _args.addAll(((Op)lf).getArguments()); else _args.add(lf); } public LF copy() { List $args = new ArrayList(_args.size()); for (LF arg : _args) { $args.add(arg.copy()); } return new Op(_name, $args); } public void deepMap(ModFcn mf) { for (Iterator argsIt = _args.iterator(); argsIt.hasNext(); ) { argsIt.next().deepMap(mf); } mf.modify(this); } public boolean occurs(Variable var) { for (Iterator argsIt = _args.iterator(); argsIt.hasNext(); ) { if (argsIt.next().occurs(var)) { return true; } } return false; } /** Returns true iff the given object equals this op. */ public boolean equals(Object o) { if (!(o instanceof Op)) return false; Op op = (Op) o; if (_name != op._name) return false; List opArgs = op._args; if (_args.size() != opArgs.size()) return false; if (!opArgs.containsAll(_args)) return false; return true; } /** Unification is not attempted for Ops. */ public void unifyCheck(Object u) throws UnifyFailure { throw new UnifyFailure(); } /** Unification is not attempted for Ops. */ public Object unify(Object u, Substitution s) throws UnifyFailure { throw new UnifyFailure(); } public Object fill(Substitution sub) throws UnifyFailure { List $args = new ArrayList(_args.size()); for (LF arg : _args) { $args.add((LF)arg.fill(sub)); } return new Op(_name, $args); } public String toString() { StringBuffer sb = new StringBuffer(); String opString = printOp(_name); if (_args.size() == 1) { sb.append(opString); sb.append(_args.get(0).toString()); } else { sb.append('('); Iterator argsIt = filteredArgs().iterator(); for (; argsIt.hasNext(); ) { sb.append(argsIt.next().toString()); if (argsIt.hasNext()) sb.append(' ').append(opString).append(' '); } sb.append(')'); } return sb.toString(); } /** * Returns a pretty-printed string of this LF, with the given indent. */ public String prettyPrint(String indent) { StringBuffer sb = new StringBuffer(); String opString = printOp(_name); if (_args.size() == 1) { sb.append(opString); sb.append(((LF)_args.get(0)).prettyPrint(indent)); } else { sb.append('('); Iterator argsIt = filteredArgs().iterator(); for (; argsIt.hasNext(); ) { sb.append(argsIt.next().prettyPrint(indent)); if (argsIt.hasNext()) sb.append(' ').append(opString).append(' '); } sb.append(')'); } return sb.toString(); } public static String printOp(String o) { if (o.equals(CONJ)) return "^"; else if (o.equals(DISJ)) return "v"; else if (o.equals(XOR)) return "v_"; else if (o.equals(NEG)) return "~"; else if (o.equals(OPT)) return "?"; else return o; } // filters out semantic features if apropos private List filteredArgs() { String featsToShow = Grammar.theGrammar.prefs.featsToShow; if (featsToShow.length() == 0) return _args; List retval = new ArrayList(_args.size()); for (Iterator it = _args.iterator(); it.hasNext(); ) { LF arg = it.next(); String attr = null; if (arg instanceof SatOp && HyloHelper.isAttrPred(arg)) attr = HyloHelper.getRel(arg); else if (arg instanceof Diamond && HyloHelper.isAttr(arg)) attr = ((Diamond)arg).getMode().toString(); if (attr == null || featsToShow.indexOf(attr) != -1) retval.add(arg); } return retval; } /** Returns a hash code. */ public int hashCode() { int retval = _name.hashCode(); for (Iterator it = _args.iterator(); it.hasNext(); ) { retval += it.next().hashCode(); } return retval; } /** * Returns a hash code using the given map from vars to ints. 
*/ public int hashCode(TObjectIntHashMap varMap) { int retval = _name.hashCode(); for (Iterator it = _args.iterator(); it.hasNext(); ) { LF arg = it.next(); retval += arg.hashCode(varMap); } return retval; } /** * Returns whether this op equals the given object * up to variable names, using the given maps from vars to ints * (where args must be in the same order). */ public boolean equals(Object obj, TObjectIntHashMap varMap, TObjectIntHashMap varMap2) { if (obj.getClass() != this.getClass()) { return false; } Op op = (Op) obj; if (!_name.equals(op._name)) return false; if (_args.size() != op._args.size()) return false; for (int i = 0; i < _args.size(); i++) { LF arg = (LF) _args.get(i); LF arg2 = (LF) op._args.get(i); if (!arg.equals(arg2, varMap, varMap2)) return false; } return true; } /** * Returns an XML representation of this LF. */ public Element toXml() { Element retval = new Element("op"); retval.setAttribute("name", _name); for (int i = 0; i < _args.size(); i++) { LF arg = (LF) _args.get(i); Element argElt = arg.toXml(); retval.addContent(argElt); } return retval; } } ================================================ FILE: src/opennlp/ccg/hylo/Proposition.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-4 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import opennlp.ccg.synsem.*; import opennlp.ccg.unify.*; import org.jdom.*; /** * A propositional value, such as the predicate "sleep", * or the value of a semantic feature, such as "past" for tense. * Types are unified if present. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.7 $, $Date: 2009/07/17 04:23:30 $ **/ public class Proposition extends HyloAtom { private static final long serialVersionUID = -5392519210634765414L; public Proposition(String name) { super(name); } public Proposition(String name, SimpleType st) { super(name, st); } public LF copy() { return new Proposition(_name, type); } public Object unify(Object u, Substitution sub) throws UnifyFailure { // check equality if (equals(u)) return this; // check for prop with compatible type if (u instanceof Proposition) { Proposition prop = (Proposition) u; if (type == null || prop.type == null) throw new UnifyFailure(); SimpleType st = (SimpleType) type.unify(prop.type, sub); // return prop with most specific type if (st.equals(type)) return this; if (st.equals(prop.type)) return prop; // otherwise return prop with name of intersection type return new Proposition(st.getName(), st); } // otherwise defer to default routine return super.unify(u, sub); } /** * Returns an XML representation of this LF. 
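 * <p>A sketch of the element shape only (the attribute value comes from {@code toString()}):
 * <pre>{@code
 * Element e = new Proposition("sleep").toXml();
 * e.getName();                  // "prop"
 * e.getAttributeValue("name");  // the printed proposition name, e.g. "sleep"
 * }</pre>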
*/ public Element toXml() { Element retval = new Element("prop"); retval.setAttribute("name", toString()); return retval; } } ================================================ FILE: src/opennlp/ccg/hylo/SatOp.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-5 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo; import opennlp.ccg.synsem.*; import opennlp.ccg.unify.*; import org.jdom.*; import java.util.*; import gnu.trove.*; /** * A hybrid logic satifaction operator, which tests whether a formula is true * a particular point named by a nominal. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.13 $, $Date: 2009/07/17 04:23:30 $ **/ public class SatOp extends HyloFormula { private static final long serialVersionUID = -4953978442971984002L; /** * The LF alts to which this LF belongs. * Null represents no alts. */ protected List alts = null; /** * Gets the LF alts to which this LF belongs. */ public List getAlts() { return alts; } /** * The LF opts (optional parts) to which this LF belongs. * LF opts are used during realization to represent * optional parts of the input. * The opts are numbered starting with 0, * and null represents no opts. */ protected TIntArrayList opts = null; /** * Gets the LF opts to which this LF belongs. */ public TIntArrayList getOpts() { return opts; } /** * The sign or unary rule which introduced this predication. */ protected LexSemOrigin _origin = null; /** * Gets the sign or unary rule which introduced this predication (or null if none). */ public LexSemOrigin getOrigin() { return _origin; } /** * Sets the sign or unary rule which introduced this predication. 
*/ public void setOrigin(LexSemOrigin origin) { _origin = origin; } // the real contents of the satop protected Nominal _nominal; protected LF _arg; public SatOp(Element e) { boolean shared = "true".equals(e.getAttributeValue("shared")); String nom = e.getAttributeValue("nom"); if (nom != null) { _nominal = new NominalAtom(HyloHelper.prefix(nom), HyloHelper.type(nom), shared); } else { nom = e.getAttributeValue("nomvar"); if (nom != null) { _nominal = new NominalVar(HyloHelper.prefix(nom), HyloHelper.type(nom), shared); } else { throw new RuntimeException("Satop must have a nom or nomvar."); } } _arg = HyloHelper.getLF_FromChildren(e); } public SatOp(Nominal nom, LF arg) { _nominal = nom; _arg = arg; } public Nominal getNominal() { return _nominal; } public void setNominal(Nominal nominal) { _nominal = nominal; } public LF getArg() { return _arg; } public void setArg(LF arg) { _arg = arg; } public LF copy() { SatOp retval = new SatOp((Nominal)_nominal.copy(), _arg.copy()); retval._origin = _origin; return retval; } public void deepMap(ModFcn mf) { _nominal.deepMap(mf); _arg.deepMap(mf); mf.modify(this); } public boolean occurs(Variable var) { return (_nominal.occurs(var) || _arg.occurs(var)); } /** Returns true iff the nominal and arg are equal. */ public boolean equals(Object o) { if (o instanceof SatOp && _nominal.equals(((SatOp)o)._nominal) && _arg.equals(((SatOp)o)._arg)) { return true; } else { return false; } } public Object unify(Object u, Substitution sub) throws UnifyFailure { if (u instanceof HyloFormula) { if (u instanceof SatOp) { Nominal $nom = (Nominal) Unifier.unify(_nominal, ((SatOp)u)._nominal, sub); LF $arg = (LF)Unifier.unify(_arg,((SatOp)u)._arg, sub); SatOp retval = new SatOp($nom, $arg); retval._origin = _origin; return retval; } else return super.unify(u,sub); } else { throw new UnifyFailure(); } } public Object fill(Substitution sub) throws UnifyFailure { SatOp retval = new SatOp((Nominal)_nominal.fill(sub), (LF)_arg.fill(sub)); retval._origin = _origin; return retval; } public String toString() { boolean includeParens = !(_arg instanceof Op); StringBuffer sbuf = new StringBuffer(); sbuf.append('@').append(_nominal.toString()); if (includeParens) { sbuf.append('('); } sbuf.append(_arg.toString()); if (includeParens) { sbuf.append(')'); } return sbuf.toString(); } /** * Returns a pretty-printed string of this LF, with the given indent. */ public String prettyPrint(String indent) { // calc new indent StringBuffer ibuf = new StringBuffer(); ibuf.append(indent).append(" "); String nomStr = _nominal.toString(); for (int i = 0; i < nomStr.length(); i++) { ibuf.append(' '); } String newIndent = ibuf.toString(); // calc string boolean includeParens = !(_arg instanceof Op); StringBuffer sbuf = new StringBuffer(); sbuf.append('@').append(nomStr); if (includeParens) { sbuf.append('('); } sbuf.append(_arg.prettyPrint(newIndent)); if (includeParens) { sbuf.append(')'); } // done return sbuf.toString(); } /** Returns a hash code using the nominal and arg. */ public int hashCode() { return _nominal.hashCode() + _arg.hashCode(); } /** * Returns a hash code using the given map from vars to ints. */ public int hashCode(TObjectIntHashMap varMap) { return _nominal.hashCode(varMap) + _arg.hashCode(varMap); } /** * Returns whether this sat op equals the given object * up to variable names, using the given maps from vars to ints. 
*/ public boolean equals(Object obj, TObjectIntHashMap varMap, TObjectIntHashMap varMap2) { if (obj.getClass() != this.getClass()) { return false; } SatOp so = (SatOp) obj; return _nominal.equals(so._nominal, varMap, varMap2) && _arg.equals(so._arg, varMap, varMap2); } /** * Returns an XML representation of this LF. */ public Element toXml() { Element retval = new Element("satop"); if (_nominal instanceof NominalAtom) { retval.setAttribute("nom", _nominal.toString()); } else { retval.setAttribute("nomvar", ((NominalVar)_nominal).nameWithType()); } Element argElt = _arg.toXml(); retval.addContent(argElt); return retval; } } ================================================ FILE: src/opennlp/ccg/hylo/graph/DefaultLFEdgeFactory.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo.graph; /** * A factory for LF edges that creates edges from specified source and target vertices and an edge label. * This class provides a default implementation of the {@link LFEdgeFactory} interface for instantiating * {@link LFGraph}s. * * @author Scott Martin */ public class DefaultLFEdgeFactory implements LFEdgeFactory { /** * Creates an edge from a specified source and target vertex. * @return A new edge with a null label. * @see #createLabeledEdge(LFVertex, LFVertex, LFEdgeLabel) */ @Override public LFEdge createEdge(LFVertex sourceVertex, LFVertex targetVertex) { return createLabeledEdge(sourceVertex, targetVertex, null); } /** * Creates a new labeled, directed edge from a specified vertex pair and edge label. * @param sourceVertex The source vertex of the new edge. * @param targetVertex The target vertex of the new edge. * @param label The label of the new edge. * @return An instance of {@link LFEdge} with the specfied parameters. * * @see LFEdge#LFEdge(LFVertex, LFVertex, LFEdgeLabel) */ @Override public LFEdge createLabeledEdge(LFVertex sourceVertex, LFVertex targetVertex, LFEdgeLabel label) { return new LFEdge(sourceVertex, targetVertex, label); } } ================================================ FILE: src/opennlp/ccg/hylo/graph/LFEdge.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. 
// // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo.graph; /** * An edge in an {@linkplain LFGraph LF graph}. LF graph edges are directed, containing a * {@linkplain #getSource() source} and {@linkplain #getTarget() target} vertex as well as * an {@linkplain #getLabel() edge label} representing the type of relation between the two * vertices. * * @author Scott Martin */ public class LFEdge { final LFVertex source, target; final LFEdgeLabel label; /** * Convenience constructor for creating edges with a null edge label. This constructor just * calls LFEdge(source, target, null). * @see #LFEdge(LFVertex, LFVertex, LFEdgeLabel) */ public LFEdge(LFVertex source, LFVertex target) { this(source, target, null); } /** * Creates a new LF edge with the specified source and target vertices, and edge label. * @param source The source vertex of the new edge. * @param target The target vertex of the new edge. * @param label The label of the new edge, possibly null. * * @throws IllegalArgumentException If either source or target is null. */ public LFEdge(LFVertex source, LFVertex target, LFEdgeLabel label) { checkVertex(source, "source"); checkVertex(target, "target"); this.source = source; this.target = target; this.label = label; } void checkVertex(LFVertex v, String name) { if(v == null) { throw new IllegalArgumentException(name + " is null"); } } /** * Gets the edge label, which may be null. */ public LFEdgeLabel getLabel() { return label; } /** * Gets the source vertex. */ public LFVertex getSource() { return source; } /** * Gets the target vertex. */ public LFVertex getTarget() { return target; } /** * Tests whether this edge is equal to another by comparing the source and target vertices by using their * {@link LFVertex#equals(Object)} methods. * If the label is null, it is considered equivalent to the other edge's label only if * the other edge's label is also null. Otherwise, the labels are compared using their * {@link LFEdgeLabel#equals(Object)} method. * * @param o The edge to compare this edge to. */ @Override public boolean equals(Object o) { if(o instanceof LFEdge) { LFEdge e = (LFEdge)o; return source.equals(e.source) && target.equals(e.target) && (label != null) ? label.equals(e.label) : e.label == null; } return false; } /** * Computes a hash code for this edge based on the hash codes of its vertices and label, assuming the * label is non-null. */ @Override public int hashCode() { int h = 37 * source.hashCode() + target.hashCode(); if(label != null) { h += label.hashCode(); } return h; } /** * Gets a string representation of this edge. For example, if the edge's source is w1@woman, * its target is w0@the, and its label is Det, this method returns * w1@woman --Det--> w0@the. */ @Override public String toString() { StringBuilder sb = new StringBuilder(source.toString()); sb.append(" --"); sb.append((label == null) ? 
"(no label)" : label.toString()); sb.append("--> "); sb.append(target.toString()); return sb.toString(); } } ================================================ FILE: src/opennlp/ccg/hylo/graph/LFEdgeFactory.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo.graph; import org.jgrapht.EdgeFactory; /** * A factory for LF edges that creates edges from specified source and target vertices and an edge label. * This interface extends the {@link EdgeFactory} interface for the specialized case of * directed, labeled LF edges with LF vertices as their nodes. A default implementation * is provided in {@link DefaultLFEdgeFactory}. * * @author Scott Martin */ public interface LFEdgeFactory extends EdgeFactory { /** * Creates a new labeled, directed edge from a specified vertex pair and edge label. * @param sourceVertex The source vertex of the new edge. * @param targetVertex The target vertex of the new edge. * @param label The label of the new edge. * @return An instance of {@link LFEdge} with the specified parameters. * * @see LFEdge#LFEdge(LFVertex, LFVertex, LFEdgeLabel) */ public LFEdge createLabeledEdge(LFVertex sourceVertex, LFVertex targetVertex, LFEdgeLabel label); } ================================================ FILE: src/opennlp/ccg/hylo/graph/LFEdgeLabel.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo.graph; import java.util.HashMap; import java.util.Map; import opennlp.ccg.hylo.Mode; /** * A label for an {@linkplain LFEdge LF edge}. LF edge labels are drawn from * {@link Mode}s, so this class encapsulates one. *

    * Since certain modes reoccur frequently, this class maintains a cache of * modes mapped to edge labels, accessible via {@link #forMode(Mode)}. * * @author Scott Martin */ public class LFEdgeLabel { final Mode mode; private static Map labelCache; /** * Creates an LF edge label with the specified mode. * @param mode The mode representing the type of relation between the vertices. * @throws IllegalArgumentException if mode is null. */ public LFEdgeLabel(Mode mode) { if(mode == null) { throw new IllegalArgumentException("mode is null"); } this.mode = mode; } /** * Gets a cached LF edge label for the specified mode, if one is available. If none * has been created yet, a new LF edge label is created and cached for later use. * Access to the cached LF edge labels is synchronized to avoid threading isues. * * @param mode The mode to create a label for. * @return Either a cached LF edge label corresponding to the specified mode, if one * is available, or a newly created one. */ public static LFEdgeLabel forMode(Mode mode) { synchronized(LFEdgeLabel.class) { LFEdgeLabel l = null; if(labelCache == null) { labelCache = new HashMap(); } else { l = labelCache.get(mode); } if(l == null) { l = new LFEdgeLabel(mode); labelCache.put(mode, l); } return l; } } /** * Gets the name of this label, as specified by its underlying * {@linkplain Mode mode}. * @return The value of getMode().getName(). */ public String getName() { return mode.getName(); } /** * Gets the mode underlying this edge label. * @return The mode specified at creation. * @see #LFEdgeLabel(Mode) */ public Mode getMode() { return mode; } /** * Computes a hash code for this LF edge label based on the hash code of its * underlying mode. */ @Override public int hashCode() { return 31 * mode.hashCode(); } /** * Tests whether this LF edge label is equivalent to another by comparing their * modes, using their {@link Mode#equals(Object)} methods. */ @Override public boolean equals(Object obj) { return (obj instanceof LFEdgeLabel) && mode.equals(((LFEdgeLabel)obj).mode); } /** * Gets a string representation of this LF edge label. * @return The value of getName(). */ @Override public String toString() { return getName(); } } ================================================ FILE: src/opennlp/ccg/hylo/graph/LFGraph.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo.graph; import java.util.HashMap; import java.util.LinkedHashSet; import java.util.Map; import java.util.Set; import opennlp.ccg.hylo.Flattener; import opennlp.ccg.hylo.Nominal; import opennlp.ccg.synsem.LF; import org.jgrapht.graph.DirectedMultigraph; /** * A graph representation of an {@link LF}. By default, LF graphs are empty. But populated LF graphs can * be easily created using the {@link LFGraphFactory} class. *

    * This class extends the {@link DirectedMultigraph} class from the org.jgrapht.graph package, adding some specialized methods for dealing with OpenCCG LFs. It provides some flexibility for edge creation by allowing an {@link LFEdgeFactory} to be specified at creation. The original LF structure is also reflected in the {@link #getLFAncestry(LFVertex)}, {@link #highestLFAncestors()}, and {@link #highestLFAncestorOf(LFVertex)} methods. *
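    * A minimal usage sketch (not from the original docs; hypothetical nominal variable, assuming a populated graph g built via {@link LFGraphFactory}):
    *   LFVertex child = g.findVertexByNominal(someNominal); // someNominal: a nominal from the source LF
    *   g.highestLFAncestorOf(child);  // the vertex highest above it in the LF ancestry, or null if it is itself highest
    *   g.highestLFAncestors();        // the set of vertices with no higher LF ancestor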

    * As a convenience, the method {@link #findVertexByNominal(Nominal)} provides access to the vertex * corresponding to a given nominal. This is implemented by a hash map so that the lookup takes place in * constant time. * * @see JGraphT website * * @author Scott Martin */ public class LFGraph extends DirectedMultigraph { private static final long serialVersionUID = 1L; //TODO make this really serializable? /** * The map reflecting LF ancestry by giving the highest ancestor for a specified * vertex, or null if it is the highest ancestor. */ protected Map highestAncestorMap = new HashMap(); /** * Convenience cache of nominals mapped to vertices. * @see #findVertexByNominal(Nominal) */ protected Map nominalVertexMap = new HashMap(); /** * Creates a new, empty LF graph that uses an implementation of {@link LFEdgeFactory} * as its edge factory. * @see #LFGraph(LFEdgeFactory) */ public LFGraph() { this(LFGraphFactory.DEFAULT_EDGE_FACTORY); } /** * Creates a new, empty LF graph using the specified edge factory. * @param lfEdgeFactory The edge factory to use for creating edges. * * @see LFGraphFactory */ public LFGraph(LFEdgeFactory lfEdgeFactory) { super(lfEdgeFactory); } /** * Gets the {@link LFEdgeFactory} used to create this LF graph. * @return The value of {@link #getEdgeFactory()}, cast to an * {@link LFEdgeFactory}. */ public LFEdgeFactory getLFEdgeFactory() { return (LFEdgeFactory)getEdgeFactory(); } /** * Adds a new labeled edge based on the specified source and target vertices and edge label by calling * getLFEdgeFactory().createLabeledEdge(source, target, label). The new * edge is added to this graph's {@linkplain #edgeSet() edge set}. * @param source The source vertex of the new edge. * @param target The target vertex of the new edge. * @param label The label of the new edge. * @return The newly created edge if it was successfully added to this graph, null otherwise. */ public LFEdge addLabeledEdge(LFVertex source, LFVertex target, LFEdgeLabel label) { LFEdge e = getLFEdgeFactory().createLabeledEdge(source, target, label); return addEdge(source, target, e) ? e : null; } /** * Finds a vertex by its nominal. This method does a lookup on a dictionary mapping each vertex's * {@linkplain LFVertex#getNominal() nominal} to members of the{@link #vertexSet()}. * @param nominal The nominal to test for. * @return A vertex whose nominal is equivalent to the one specified, or null if none is present. */ public LFVertex findVertexByNominal(Nominal nominal) { return nominalVertexMap.get(nominal); } /** * Overrides the superclass method to add a mapping from the vertex's {@linkplain LFVertex#getNominal() nominal} * to the vertex itself, for later retrieval via {@link #findVertexByNominal(Nominal)}. */ @Override public boolean addVertex(LFVertex v) { boolean b = super.addVertex(v); // give this a chance first if(b) { nominalVertexMap.put(v.nominal, v); } return b; } /** * Overrides the superclass method to remove any existing mapping from some nominal to the specified vertex. * @see #addVertex(LFVertex) * @see #findVertexByNominal(Nominal) */ @Override public boolean removeVertex(LFVertex v) { boolean b = super.removeVertex(v); // invoke this first if(b) { nominalVertexMap.values().remove(v); } return b; } /** * Gets the highest LF ancestor of the specified vertex, as determined by the LF structure. * @param vertex The vertex to get the highest ancestor for. * @return The highest ancestor of the specified vertex, or null if it is the highest in its * ancestry. 
* @see Flattener#getHighestParentMap() */ public LFVertex highestLFAncestorOf(LFVertex vertex) { return highestAncestorMap.get(vertex); } /** * Gets the LF ancestry corresponding to the specified vertex. * * @return The parents of the specified vertex in the LF ancestry. * @see #highestLFAncestorOf(LFVertex) * @see Flattener#getHighestParentMap() */ public Set getLFAncestry(LFVertex vertex) { LFVertex a = highestLFAncestorOf(vertex); Set as = new LinkedHashSet(); for(LFVertex v : vertexSet()) { if(!v.equals(vertex) && highestLFAncestorOf(v).equals(a)) { as.add(v); } } return as; } /** * Gets the vertex or vertices that are at the top of the LF ancestry hierarchy. * @return The set of vertices v for which {@link #highestLFAncestorOf(LFVertex)} returns * null. * @see Flattener#getHighestParentMap() */ public Set highestLFAncestors() { Set ps = new LinkedHashSet(); for(LFVertex v : vertexSet()) { if(highestLFAncestorOf(v) == null) { ps.add(v); } } return ps; } } ================================================ FILE: src/opennlp/ccg/hylo/graph/LFGraphFactory.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo.graph; import static opennlp.ccg.hylo.HyloHelper.isAttrPred; import static opennlp.ccg.hylo.HyloHelper.isElementaryPredication; import static opennlp.ccg.hylo.HyloHelper.isLexPred; import static opennlp.ccg.hylo.HyloHelper.isRelPred; import java.util.List; import java.util.Map; import opennlp.ccg.hylo.Diamond; import opennlp.ccg.hylo.Flattener; import opennlp.ccg.hylo.HyloHelper; import opennlp.ccg.hylo.Nominal; import opennlp.ccg.hylo.Proposition; import opennlp.ccg.hylo.SatOp; import opennlp.ccg.realize.Realizer; import opennlp.ccg.synsem.LF; import org.jdom.Element; import org.jdom.input.DOMBuilder; /** * Factory class for creating LF graphs based on {@link LF}s and XML elements * that represent them. Graph factories cannot be instantiated, however, their * methods for building LF graphs are statically accessible. * * @author Scott Martin * @see LFGraph * @see LFGraphFactory#newGraphFrom(LF) */ public class LFGraphFactory { /** * An instance of {@link DefaultLFEdgeFactory}. */ public static final LFEdgeFactory DEFAULT_EDGE_FACTORY = new DefaultLFEdgeFactory(); static final DOMBuilder DOM_BUILDER = new DOMBuilder(); static final Flattener FLATTENER = new Flattener(); private LFGraphFactory() { // can't instantiate } /** * Builds a new LF graph based on the representation provided in the specified w3c XML element. * @param lfElement The XML element with root element tagged lf. 
* @return The value of {@link #newGraphFrom(Element)} after using a {@link DOMBuilder} to create a * jdom document. * * @see #newGraphFrom(Element) */ public static LFGraph newGraphFrom(org.w3c.dom.Element lfElement) { return newGraphFrom(DOM_BUILDER.build(lfElement)); } /** * Creates a new LF graph from the corresponding representation contained in the specified * jdom XML element. * @param lfElement The jdom element containing the representation of the LF. * @return An LF graph build from an {@link LF} object obtained by calling * {@link Realizer#getLfFromElt(Element)}. * * @see LFGraphFactory#newGraphFrom(LF) */ public static LFGraph newGraphFrom(Element lfElement) { return newGraphFrom(Realizer.getLfFromElt(lfElement)); } /** * Creates a new LF graph based on the specified LF object. The LF object is first flattened, and then * its LF ancestry structure is obtained by calling {@link Flattener#getHighestParentMap()}. *

    * This method makes two passes over the list of {@link SatOp}s obtained by flattening the specified LF. The first pass adds a vertex to the graph for every lexical predication (as determined by {@link HyloHelper#isLexPred(LF)}), built from the {@linkplain SatOp#getNominal() SatOp's nominal} and {@linkplain SatOp#getArg() proposition argument}. *

    * The second pass proceeds by cases, depending on the nature of the SatOp in question:
    * - Lexical predications cause the new LF graph to be updated with the corresponding LF ancestry, as determined by {@link Flattener#getHighestParentMap()}.
    * - Relation predications cause a new {@link LFEdge} to be added to the LF graph based on the {@linkplain SatOp#getArg() SatOp's argument} and {@linkplain Diamond#getMode() the argument's mode}.
    * - Attribute-value predications cause the vertex corresponding to the {@linkplain SatOp#getNominal() SatOp's nominal} to have attributes {@linkplain LFVertex#setAttribute(opennlp.ccg.hylo.Mode, Proposition) added} based on the {@linkplain SatOp#getArg() SatOp's argument}.
    * where the nature of the SatOp in question is determined using {@link HyloHelper#isLexPred(LF)}, * {@link HyloHelper#isRelPred(LF)}, and {@link HyloHelper#isAttrPred(LF)}. * * @param lf The LF object to build an LF graph for. * @return A new LF graph whose vertices represent the nominals in the LF's flattened representation and * whose edges represent its relation predications. * @throws IllegalArgumentException If lf is null. */ public static LFGraph newGraphFrom(LF lf) { if(lf == null) { throw new IllegalArgumentException("lf is null"); } LFGraph g = new LFGraph(DEFAULT_EDGE_FACTORY); Flattener f = new Flattener(); List satOps = f.flatten(lf); Map ancestorMap = f.getHighestParentMap(); for(SatOp so : satOps) { // first pass adds vertices if(isLexPred(so)) { g.addVertex(new LFVertex(so.getNominal(), (Proposition)so.getArg())); } } for(SatOp so : satOps) { // second pass adds edges and attributes, sets highest parent (if any) if(isElementaryPredication(so)) { Nominal soNom = so.getNominal(); LFVertex source = g.findVertexByNominal(soNom); // check if node is not yet added (not a lex. pred.) if(source == null) { source = new LFVertex(soNom); g.addVertex(source); } if(isLexPred(so)) { Nominal parent = ancestorMap.get(source.nominal); if(parent != null) { g.highestAncestorMap.put(source, g.findVertexByNominal(parent)); } } else if(isRelPred(so)) { Diamond d = (Diamond)so.getArg(); Nominal dArg = (Nominal)d.getArg(); LFVertex target = g.findVertexByNominal(dArg); if(target == null) { target = new LFVertex(dArg); g.addVertex(target); } g.addLabeledEdge(source, target, LFEdgeLabel.forMode(d.getMode())); } else if(isAttrPred(so)) { Diamond d = (Diamond)so.getArg(); source.addAttribute(d.getMode(), (Proposition)d.getArg()); } } } return g; } } ================================================ FILE: src/opennlp/ccg/hylo/graph/LFVertex.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo.graph; import java.util.Collections; import java.util.HashMap; import java.util.Map; import java.util.Set; import opennlp.ccg.hylo.Mode; import opennlp.ccg.hylo.Nominal; import opennlp.ccg.hylo.Proposition; import opennlp.ccg.hylo.SatOp; /** * A vertex in an {@link LFGraph}. Vertices are based on {@link SatOp}s, encapsulating their * {@linkplain SatOp#getNominal() nominal} and {@linkplain SatOp#getArg() proposition argument} (or * null if there is no associated proposition). * Vertices also maintain a list of attribute/value pairs representing their associated attribute/value * predications. *
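    * A minimal usage sketch (not from the original docs; hypothetical nominal, proposition, and mode values):
    *   LFVertex v = new LFVertex(nom, prop);  // e.g. a vertex that prints as w9@walk
    *   v.setAttribute(numMode, sgValue);      // record an attribute/value pair
    *   v.getAttributeValue(numMode);          // -> sgValue
    *   v.toString();                          // roughly "w9@walk {num=sg}"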

    * The {@linkplain #getIndex() index} and {@linkplain #getType() type} of an LF vertex are determined by * the specified nominal's {@linkplain Nominal#getName() name}. For example, if a vertex's * {@linkplain #getName() name} is w12, then {@link #getIndex()} returns 12 and * {@link #getType()} returns {@link LFVertexType#WORD}. * * @author Scott Martin * @see LFGraph * @see LFVertexType * @see SatOp */ public class LFVertex { final Nominal nominal; final Proposition proposition; /** * This vertex's attribute map. */ protected Map attributes; private Integer index; private LFVertexType type; /** * Creates a new LF vertex based on the specified SatOp. * @param satOp The SatOp to use for creating a new LF vertex, using its nominal and argument. * @see #LFVertex(Nominal, Proposition) */ public LFVertex(SatOp satOp) { this(satOp.getNominal(), (Proposition)satOp.getArg()); } /** * Creates a new LF vertex based on the specified nominal, with a null proposition. * @see #LFVertex(Nominal, Proposition) */ public LFVertex(Nominal nominal) { this(nominal, null); } /** * Creates a new LF vertex based on the specified nominal and proposition. * @see #LFVertex(Nominal, Proposition, Map) */ public LFVertex(Nominal nominal, Proposition proposition) { this(nominal, proposition, null); } /** * Creates a new LF vertex based on the specified nominal and proposition, with the specified attribute * map (which can be null). * @throws IllegalArgumentException if nominal is null. */ public LFVertex(Nominal nominal, Proposition proposition, Map attributes) { if(nominal == null) { throw new IllegalArgumentException("nominal is null"); } this.nominal = nominal; this.proposition = proposition; this.attributes = attributes; } /** * Gets this LF vertex's name, determined by the name of its {@linkplain #getNominal() nominal}. * @return The value of getNominal().getName(). */ public String getName() { return getNominal().getName(); } /** * Gets this LF vertex's associated predicate, the name of its {@linkplain #getProposition() proposition}. * @return The value of getProposition().getName(), if this vertex's proposition is non-null, * and null otherwise. */ public String getPredicate() { Proposition p = getProposition(); return (p == null) ? null : p.getName(); } /** * Gets this LF vertex's associated nominal. */ public Nominal getNominal() { return nominal; } /** * Gets this LF vertex's associated proposition. * @return Possibly null, if no proposition was provided at creation. * @see #LFVertex(Nominal) */ public Proposition getProposition() { return proposition; } /** * Gets the type of this LF vertex, as determined by the prefix of its {@linkplain #getNominal() nominal}'s * name. For example, if this vertex's {@linkplain Nominal#getName() name} is x3, then * this method returns * {@link LFVertexType#fromPrefix(String) LFVertexType.fromPrefix}('x') == {@link LFVertexType#NONWORD}. * @return The value of {@link LFVertexType#fromPrefix(String)} for this vertex's * {@linkplain #getNominal() nominal}'s {@linkplain Nominal#getName() name}. * @see LFVertexType */ public LFVertexType getType() { return (type == null) ? (type = LFVertexType.fromPrefix(nominal.getName())) : type; } /** * Gets the word index associated with this LF vertex, as determined by {@link #parseVertexIndex(Nominal)}. */ public Integer getIndex() { return (index == null) ? (index = parseVertexIndex(nominal)) : index; } /** * Parses the word index associated with the specified nominal, obtained by parsing its name. 
For * example, if the specified nominal's name is x9, this method returns the integer * 9. * @param nominal The nominal to find the word index for. * @return The integer index corresponding to the specified nominal, determined by parsing its * {@linkplain Nominal#getName() name}. */ public static Integer parseVertexIndex(Nominal nominal) { String nm = nominal.getName(); int colidx = nm.indexOf(':'); String s = (colidx == -1) ? nm : nm.substring(0, colidx); return Integer.parseInt(s.substring(1)); } /** * Gets the attribute map associated with this LF vertex. Note that the returned map is * not modifiable; to modify a vertex's attributes, the methods * {@link #setAttribute(Mode, Proposition)} and {@link #removeAttribute(Mode)} * should be used. * @return An unmodifiable copy of the attribute map encapsulated by this vertex, or * {@link Collections#EMPTY_MAP} if no attributes are present. * @see Collections#unmodifiableMap(Map) */ @SuppressWarnings("unchecked") public Map getAttributeMap() { return (attributes == null) ? Collections.EMPTY_MAP : Collections.unmodifiableMap(attributes); } /** * Gets the names of this LF vertex's attributes. Note that the returned set is not modifiable; * the methods {@link #setAttribute(Mode, Proposition)} and {@link #removeAttribute(Mode)} should * be used to modify this vertex's attribute/value pairs. * @return The value of getAttributeMap().keySet(), or {@link Collections#EMPTY_SET} if * no attributes are present. * @see Collections#unmodifiableSet(Set) */ @SuppressWarnings("unchecked") public Set attributeNames() { return (attributes == null) ? Collections.EMPTY_SET : Collections.unmodifiableSet(attributes.keySet()); } /** * Tests whether this vertex contains an attribute with the associated attribute name. * @param attributeName The name of the attribute to test for. * @return true if this vertex has an attribute named attributeName. * @see #attributeNames() */ public boolean containsAttribute(Mode attributeName) { return (attributes != null && attributes.containsKey(attributeName)); } /** * Gets the value of the attribute with the specified mode name. * @param attributeName The attribute name to retrieve a value for. * @return The associated attribute value, or null if none is present. */ public Proposition getAttributeValue(Mode attributeName) { return (attributes == null) ? null : attributes.get(attributeName); } /** * Adds an attribute/value to this vertex's attributes. * @param attributeName The name of the new attribute. * @param value The value of the new attribute. * @return True if this vertex's attribute/value map changed as a result of the call because * either (1) no attribute named attributeName was present or (2) * the value associated with attributeName changed (was different from value). * @see #setAttribute(Mode, Proposition) */ public boolean addAttribute(Mode attributeName, Proposition value) { // works even when setAttribute() returns null return !value.equals(setAttribute(attributeName, value)); } /** * Sets the attribute associated with the specified mode name to the specified proposition value. * @param attributeName The key to set the value for. * @param value The value that will be associated with attributeName. * @return The value previously associated with attributeName, or null if no value * was previously associated. 
* @see Map#put(Object, Object) */ public Proposition setAttribute(Mode attributeName, Proposition value) { if(attributes == null) { attributes = new HashMap(); } return attributes.put(attributeName, value); } /** * Removes and returns the value associated with the specified attribute name. * @param attributeName The name to remove the value for. * @return The value previously associated with attributeName, or null if no value * was associated with it. */ public Proposition removeAttribute(Mode attributeName) { return (attributes == null) ? null : attributes.remove(attributeName); } /** * Gets a hash code for this vertex based on its nominal and proposition, if the proposition is * non-null. */ @Override public int hashCode() { int i = 37 * nominal.hashCode(); if(proposition != null) { i += proposition.hashCode(); } // Don't include attributes in hash code calculation. This could cause problems if a vertex is // added to a collection that relies on hashing, and then the attributes are later modified. return i; } /** * Tests whether this LF vertex is equal to another by comparing their nominals and possibly also their * propositions and attributes, if they are non-null/non-empty. * @see #getNominal() * @see #getProposition() * @see #getAttributeMap() */ @Override public boolean equals(Object obj) { if(obj instanceof LFVertex) { LFVertex v = (LFVertex)obj; return nominal.equals(v.nominal) && ((proposition == null) ? v.proposition == null : proposition.equals(v.proposition)) && ((attributes == null) ? v.attributes == null : attributes.equals(v.attributes)); } return false; } /** * Gets a string representation of this LF vertex. For example, if this vertex's name is w9, * its proposition's name is walk, and its attribute map contains num=sg and * det=nil, this method returns w9@walk {num=sg, det=nil}. */ @Override public String toString() { StringBuilder sb = new StringBuilder(nominal.getName()); if(proposition != null) { sb.append('@'); sb.append(proposition.getName()); } if(attributes != null && !attributes.isEmpty()) { sb.append(' '); sb.append(attributes.toString()); } return sb.toString(); } } ================================================ FILE: src/opennlp/ccg/hylo/graph/LFVertexType.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.hylo.graph; /** * A set of enum constants indicating the type of an LF vertex. The type of a vertex is * also signaled by the character prefix of its name, as in w9 and x3. * * @author Scott Martin */ public enum LFVertexType { /** * The type of vertices representing words, with prefix w. 
*/ WORD('w'), /** * The type of vertices representing nonwords, prefixed x. */ NONWORD('x'); /** * The prefix character for this vertex type. */ final Character prefix; private LFVertexType(Character prefix) { this.prefix = prefix; } /** * Gets the naming prefix used by this vertex type. */ public Character getPrefix() { return prefix; } /** * Gets the LF vertex type corresponding to the specified prefix string. * * @param string The prefix string. * @return The value of {@link #fromPrefix(Character)} for the first character in the * specified string. * * @see #fromPrefix(Character) */ public static LFVertexType fromPrefix(String string) { return fromPrefix(Character.valueOf(string.charAt(0))); } /** * Gets the LF vertex type corresponding to the specified character prefix. * @param prefix The prefix character. * @return The vertex type with the specified prefix, as determined by * {@link #getPrefix()}, or {@link #NONWORD} if there is no vertex type for the given * prefix character. */ public static LFVertexType fromPrefix(Character prefix) { for(LFVertexType type : values()) { if(type.prefix.equals(prefix)) { return type; } } return NONWORD; } } ================================================ FILE: src/opennlp/ccg/hylo/graph/package.html ================================================

    Provides representations of {@link opennlp.ccg.synsem.LF}s as traversable graphs based on the JGraphT package, as well as customized filters for sets of edges in those graphs.

    {@link opennlp.ccg.hylo.graph.LFGraph}s can be created on their own, or from an existing {@link opennlp.ccg.synsem.LF} (or XML structure representing one) using the {@link opennlp.ccg.hylo.graph.LFGraphFactory}. LF graphs are also customizable in that different edge factories can be specified by implementing {@link opennlp.ccg.hylo.graph.LFEdgeFactory} (a default implementation is provided in {@link opennlp.ccg.hylo.graph.DefaultLFEdgeFactory}).
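    As a quick orientation, here is a minimal usage sketch (not part of the original package documentation; the class and method names in the sketch are hypothetical), assuming an {@link opennlp.ccg.synsem.LF} has already been obtained elsewhere, for example from an lf element via {@link opennlp.ccg.realize.Realizer#getLfFromElt}:

    import opennlp.ccg.hylo.graph.*;
    import opennlp.ccg.synsem.LF;

    public class LFGraphDemo {
        /** Builds a populated graph from an existing LF and prints its structure. */
        public static void printGraph(LF lf) {
            // vertices come from lexical predications, edges from relation predications
            LFGraph graph = LFGraphFactory.newGraphFrom(lf);
            // each edge prints as "source --Label--> target"
            for (LFEdge edge : graph.edgeSet()) {
                System.out.println(edge);
            }
            // vertices with no higher LF ancestor are the roots of the original LF
            System.out.println("roots: " + graph.highestLFAncestors());
        }
    }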

    ================================================ FILE: src/opennlp/ccg/lexicon/DataItem.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002 Jason Baldridge and Gann Bierner // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; import org.jdom.*; /** * Data structure for storing information about a lexical entry. Specifically * used by LMR grammars. * * @author Jason Baldridge * @version $Revision: 1.2 $, $Date: 2007/12/17 20:02:23 $ */ public class DataItem { private String stem = ""; private String pred = ""; public DataItem() {} public DataItem (String s, String p) { stem = s; pred = p; } public DataItem(Element datael) { stem = datael.getAttributeValue("stem"); pred = datael.getAttributeValue("pred"); if (null == pred) { pred = stem; } } public void setStem(String s) { stem = s; } public void setPred(String s) { pred = s; } public String getStem() { return stem; } public String getPred() { return pred; } } ================================================ FILE: src/opennlp/ccg/lexicon/DefaultTokenizer.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004-5 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; import opennlp.ccg.grammar.Grammar; import opennlp.ccg.util.*; import java.text.*; import java.util.*; import javax.xml.datatype.*; import gnu.trove.*; /** * DefaultTokenizer provides a default implementation of the * Tokenizer interface. 
* * @author Michael White * @version $Revision: 1.32 $, $Date: 2010/12/09 04:58:12 $ **/ public class DefaultTokenizer implements Tokenizer { // date format with pattern yyyy.MM.dd, strict parsing private DateFormat dateFormat = null; // date format with pattern *.MM.dd, strict parsing private DateFormat dateFormatNoYear = null; // time format with pattern HH:mm, strict parsing private DateFormat timeFormat = null; // factory for parsing durations, in format "PnYnMnDTnHnMnS", as defined in XML Schema 1.0 section 3.2.6.1 private DatatypeFactory datatypeFactory = null; /** * Map from special token semantic classes to special token constants. * The map is initialized in the constructor, where * the standard constants (eg Tokenizer.DATE_CLASS and Tokenizer.DATE_VAL) are added. */ protected Map specialTokenMap = null; /** * A set containing semantic classes to replace words with for language models. * Equality is checked with identity, for use with interned strings. */ @SuppressWarnings("unchecked") protected Set replacementSemClasses = new THashSet(new TObjectIdentityHashingStrategy()); /** * Constructor. */ public DefaultTokenizer() { // init date, time formats dateFormat = new SimpleDateFormat("yyyy.MM.dd", Locale.ENGLISH); dateFormat.setLenient(false); dateFormatNoYear = new SimpleDateFormat("*.MM.dd", Locale.ENGLISH); dateFormatNoYear.setLenient(false); timeFormat = new SimpleDateFormat("HH:mm", Locale.ENGLISH); timeFormat.setLenient(false); // init data type factory try { datatypeFactory = DatatypeFactory.newInstance(); } catch (DatatypeConfigurationException exc) { throw (RuntimeException) new RuntimeException().initCause(exc); } // init special token map specialTokenMap = new HashMap(); specialTokenMap.put(Tokenizer.DATE_CLASS, Tokenizer.DATE_VAL); specialTokenMap.put(Tokenizer.TIME_CLASS, Tokenizer.TIME_VAL); specialTokenMap.put(Tokenizer.NUM_CLASS, Tokenizer.NUM_VAL); specialTokenMap.put(Tokenizer.AMT_CLASS, Tokenizer.AMT_VAL); specialTokenMap.put(Tokenizer.DUR_CLASS, Tokenizer.DUR_VAL); specialTokenMap.put(Tokenizer.NE_CLASS, Tokenizer.NE_VAL); } /** * Adds a semantic class to replace words with for language models. */ public void addReplacementSemClass(String semClass) { replacementSemClasses.add(semClass.intern()); } /** * Returns whether the given semantic class is one to replace words with for language models. * The sem class is assumed to have been interned. */ public boolean isReplacementSemClass(String semClass) { return replacementSemClasses.contains(semClass); } /** * Parses an input string into a list of words, * including any explicitly given factors, * and the semantic class of special tokens. * Tokens are parsed into words using parseToken with the strictFactors * flag set to false. */ public List tokenize(String s) { return tokenize(s, false); } /** * Parses an input string into a list of words, * including any explicitly given factors, * and the semantic class of special tokens. * Tokens are parsed into words using parseToken, according to the given * flag for whether to parse factors strictly. * The string is assumed to have white-space delimited tokens. */ public List tokenize(String s, boolean strictFactors) { List retval = new ArrayList(); StringTokenizer st = new StringTokenizer(s); while (st.hasMoreTokens()) { retval.add(parseToken(st.nextToken(), strictFactors)); } return retval; } /** * Parses a token into a word, including any explicitly given factors * and the semantic class of special tokens. 
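    * A minimal sketch (hypothetical surface values; the literal spellings of the Tokenizer constants are not shown), using the separators described for parseToken(String, boolean): factors are colon-separated, with a hyphen between each attribute and its value.
    *   String tok = "ran" + ":" + Tokenizer.STEM_ATTR + "-run" + ":" + Tokenizer.POS_ATTR + "-VBD";
    *   Word w = parseToken(tok);
    *   // w.getForm() -> "ran", w.getStem() -> "run", w.getPOS() -> "VBD"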
* Parsing is performed using parseToken with the strictFactors * flag set to false. */ public Word parseToken(String token) { return parseToken(token, false); } /** * Parses a token into a word, including any explicitly given factors * and the semantic class of special tokens, according to the given * flag for whether to parse factors strictly. * Recognized pitch accents may be appended to the word form with an underscore. * If the strictFactors flag is true, then colons are always assumed to * separate attribute-value pairs, and hyphens are always assumed to * separate attributes from values, and thus colons or hyphens not used as separators * must be escaped. * If the strictFactors flag is false, then there must be at least one colon * and at least one hyphen in the token to trigger parsing of factors, * in which case colons or hyphens not used as separators * must again be escaped; otherwise, colons or hyphens on their own may * appear without escaping in the word form. * After splitting the token into factors, it is unescaped. */ public Word parseToken(String token, boolean strictFactors) { // init String form = token; String pitchAccent = null; List> attrValPairs = null; String stem = null; String POS = null; String supertag = null; String semClass = null; // handle colon-separated attr-val pairs int colonPos = token.indexOf(':'); int hyphenPos = token.indexOf('-'); if (strictFactors || (colonPos > 0 && hyphenPos > 0)) { // deal with special cases before first colon, if any String suffix; if (colonPos > 0 && hyphenPos > colonPos) { form = token.substring(0, colonPos); suffix = token.substring(colonPos+1); } else if (colonPos < 0 && hyphenPos < 0) { form = token; suffix = null; } else { form = null; suffix = token; } while (suffix != null) { hyphenPos = suffix.indexOf('-'); String attr = suffix.substring(0, hyphenPos); String val = suffix.substring(hyphenPos+1); colonPos = suffix.indexOf(':'); if (colonPos > 0) { val = suffix.substring(hyphenPos+1, colonPos); suffix = suffix.substring(colonPos+1); } else suffix = null; attr = unescape(attr); val = unescape(val); if (attr.equals(Tokenizer.WORD_ATTR)) { form = val; continue; } if (attr.equals(Tokenizer.STEM_ATTR)) { stem = val; continue; } if (attr.equals(Tokenizer.POS_ATTR)) { POS = val; continue; } if (attr.equals(Tokenizer.SUPERTAG_ATTR)) { supertag = val; continue; } if (attr.equals(Tokenizer.SEM_CLASS_ATTR)) { semClass = val; continue; } if (attr.equals(Tokenizer.PITCH_ACCENT_ATTR)) { pitchAccent = val; continue; } if (attrValPairs == null) attrValPairs = new ArrayList>(5); attrValPairs.add(new Pair(attr, val)); } } // check for pitch accent preceded by an underscore int pos = (form != null) ? form.lastIndexOf("_") : -1; if (pos > 0) { String suffix = form.substring(pos+1); if (Grammar.isPitchAccent(suffix)) { pitchAccent = suffix; form = form.substring(0, pos); } } // unescape form (unless it happens to be "null") if (!"null".equals(form)) form = unescape(form); // check for special token String specialTokenClass = isSpecialToken(form); if (specialTokenClass != null) semClass = specialTokenClass; // done return Word.createWord(form,pitchAccent,attrValPairs,stem,POS,supertag,semClass); } /** * Returns a string (eg Tokenizer.DATE_CLASS) indicating the semantic class * of special token, if the given token is recognized as a special * token; otherwise returns null. 
*/ public String isSpecialToken(String token) { if (token == null) return null; if (isDate(token)) return Tokenizer.DATE_CLASS; if (isTime(token)) return Tokenizer.TIME_CLASS; if (isNum(token)) return Tokenizer.NUM_CLASS; if (isAmt(token)) return Tokenizer.AMT_CLASS; if (isDur(token)) return Tokenizer.DUR_CLASS; if (isNamedEntity(token)) return Tokenizer.NE_CLASS; return null; } /** * Returns the special token constant for the given special token class, * or null if none. */ public String getSpecialTokenConstant(String semClass) { if (semClass == null) return null; return specialTokenMap.get(semClass); } /** * Returns true iff the given string is a special token constant * (eg Tokenizer.DATE_VAL). */ public boolean isSpecialTokenConstant(String s) { return specialTokenMap.containsValue(s); } /** * Returns true iff the token is recognized as a date. * The default implementation recognizes dates in the * format yyyy.MM.dd, e.g. "2004.05.07", or *.MM.dd, e.g. "*.05.07", * which is taken to mean the 5th of May (in the contextually * appropriate year). Note that by including the "*." prefix, * the format avoids being ambiguous between a date or number; * that is, with this format, something like "10.01" is * unambiguously a number, whereas "*.10.01" means the 1st of * October. */ public boolean isDate(String token) { ParsePosition pos = new ParsePosition(0); Date date = dateFormat.parse(token, pos); if (date != null && pos.getIndex() == token.length()) return true; pos = new ParsePosition(0); date = dateFormatNoYear.parse(token, pos); return (date != null && pos.getIndex() == token.length()); } /** * Returns true iff the token is recognized as a time. * The default implementation recognizes times in the * 24-hour format HH:mm, e.g. "00:12" or "15:03". */ public boolean isTime(String token) { ParsePosition pos = new ParsePosition(0); Date time = timeFormat.parse(token, pos); return (time != null && pos.getIndex() == token.length()); } /** * Returns true iff the token is recognized as a number. * The default implementation returns true if the token * can be parsed as an integer or double, though not one * in scientific notation. */ public boolean isNum(String token) { try { Integer.parseInt(token); return true; } catch (NumberFormatException exc) { try { Double.parseDouble(token); if (token.indexOf('E') != -1) return false; if (token.indexOf('e') != -1) return false; return true; } catch (NumberFormatException exc2) { return false; } } } /** * Returns true iff the token is recognized as an amount. * The default implementation only handles currency amounts. * The token is recognized as an amount if it begins with * a number and ends with an ISO-4217 currency code. * (See http://www.xe.com/iso4217.htm.) */ public boolean isAmt(String token) { if (token.length() < 4) return false; String code = token.substring(token.length()-3); try { Currency.getInstance(code); } catch (IllegalArgumentException exc) { return false; } String num = token.substring(0,token.length()-3).trim(); return isNum(num); } /** * Returns true iff the token is recognized as a duration. * The format is "PnYnMnDTnHnMnS", as defined in XML Schema 1.0 section 3.2.6.1. * For example, "PT5H30" is 5 hours and 30 minutes. */ public boolean isDur(String token) { try { datatypeFactory.newDuration(token); return true; } catch (Exception exc) { return false; } } /** * Returns true iff the token is recognized as a named entity (not listed in lexicon). * The default implementation always returns false. 
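    * Subclasses may override this method to consult an external named-entity list or tagger; a minimal sketch (hypothetical field name):
    *   public boolean isNamedEntity(String token) { return myNamedEntitySet.contains(token); }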
*/ public boolean isNamedEntity(String token) { return false; } /** * Returns a string for the given list of words. * A space separates the string for each word, as determined by getOrthography(Word,false). */ public String getOrthography(List words) { return getOrthography(words, false); } /** * Returns a string for the given list of words, optionally with semantic class replacement. * A space separates the string for each word, as determined by getOrthography(Word,semClassReplacement). */ public String getOrthography(List words, boolean semClassReplacement) { StringBuffer sb = new StringBuffer(); for (int i = 0; i < words.size(); i++) { Word w = (Word) words.get(i); sb.append(getOrthography(w, semClassReplacement)); if (i < words.size()-1) sb.append(" "); } return sb.toString(); } /** * Returns a string for the given word, optionally with semantic class replacement. * The default implementation returns the word's form - or semantic class, if apropos - * followed by its pitch accent (if non-null) separated by an underscore, * followed by any further attribute values, also separated by underscores. * With the semantic class replacement option, the word form is replaced with * the semantic class, uppercased, if the class is listed as one to replace words with for * language models. */ public String getOrthography(Word w, boolean semClassReplacement) { StringBuffer sb = new StringBuffer(); String semClass = w.getSemClass(); if (semClassReplacement && semClass != null && replacementSemClasses.contains(semClass)) sb.append(semClass.toUpperCase()); else sb.append(w.getForm()); if (w.getPitchAccent() != null) sb.append("_").append(w.getPitchAccent()); for (Iterator> it = w.getAttrValPairs(); it.hasNext(); ) { Pair p = it.next(); sb.append("_").append(p.b); } return sb.toString(); } /** * Returns a string for the given list of words, * in the format expected by the SRILM tool for factored language models. * A space separates the string for each word, determined by format(Word). */ public String format(List words) { return format(words, false); } /** * Returns a string for the given list of words, * in the format expected by the SRILM tool for factored language models, * optionally with semantic class replacement. * A space separates the string for each word, determined by format(Word,boolean). */ public String format(List words, boolean semClassReplacement) { StringBuffer sb = new StringBuffer(); sb.append(" "); for (int i = 0; i < words.size(); i++) { Word w = words.get(i); if (w.getForm() == "" || w.getForm() == "") continue; // skip or sb.append(format(w, semClassReplacement)); sb.append(" "); } sb.append(""); return sb.toString(); } /** * Returns a string for the given word, * in the format expected by the SRILM tool for factored language models. * All factors are escaped. */ public String format(Word w) { return format(w, false); } /** * Returns a string for the given word, * in the format expected by the SRILM tool for factored language models, * optionally with semantic class replacement. * All factors are escaped. * With the semantic class replacement option, the word form and stem are replaced with * the semantic class, uppercased, if the class is listed as one to replace words with for * language models. 
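 * Illustratively, a word with form "bought", stem "buy" and POS "VBD"
 * (and no other factors) is formatted as
 * "bought:" + Tokenizer.STEM_ATTR + "-buy:" + Tokenizer.POS_ATTR + "-VBD",
 * i.e. colon-separated attr-val factors following the escaped form.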
*/ public String format(Word w, boolean semClassReplacement) { StringBuffer sb = new StringBuffer(); String form = w.getForm(); String pitchAccent = w.getPitchAccent(); String stem = w.getStem(); String POS = w.getPOS(); String supertag = w.getSupertag(); String semClass = w.getSemClass(); if (semClassReplacement && semClass != null && replacementSemClasses.contains(semClass)) { form = escape(semClass.toUpperCase()); stem = form; } sb.append(escape(form)); if (pitchAccent != null) sb.append(":").append(Tokenizer.PITCH_ACCENT_ATTR).append("-").append(escape(pitchAccent)); for (Iterator> it = w.getAttrValPairs(); it.hasNext(); ) { Pair p = it.next(); String attr = p.a; String val = p.b; if (val != null) sb.append(":").append(escape(attr)).append("-").append(escape(val)); } if (stem != null) sb.append(":").append(Tokenizer.STEM_ATTR).append("-").append(escape(stem)); if (POS != null) sb.append(":").append(Tokenizer.POS_ATTR).append("-").append(escape(POS)); if (supertag != null) sb.append(":").append(Tokenizer.SUPERTAG_ATTR).append("-").append(escape(supertag)); if (semClass != null) sb.append(":").append(Tokenizer.SEM_CLASS_ATTR).append("-").append(escape(semClass)); return sb.toString(); } /** * Returns an encoding of the given string where * the characters for ampersand, less-than, greater-than, * apostrophe, quote, colon and hyphen are escaped * using HTML conventions. * Null is returned for the null string. * An initial substring 'null' is doubled. */ public static String escape(String s) { if (s == null) return null; StringBuffer output = null; // instantiate only if needed if (s.startsWith("null")) { output = new StringBuffer(); output.append("null"); } for(int i=0; i < s.length(); i++) { char c = s.charAt(i); if (output == null && (c=='<' || c=='>' || c=='&' || c=='\'' || c=='"' || c==':' || c=='-')) { output = new StringBuffer(); output.append(s.substring(0,i)); } if (output != null) { switch(c) { case '<': output.append("<"); break; case '>': output.append(">"); break; case '&': output.append("&"); break; case '\'': output.append("'"); break; case '"': output.append("""); break; case ':': output.append("&#").append((int)':').append(";"); break; case '-': output.append("&#").append((int)'-').append(";"); break; default: output.append(c); } } } return (output != null) ? output.toString() : s; } /** * Returns a decoding of the given string where * the characters for ampersand, less-than, greater-than, * apostrophe, quote, colon and hyphen (and any other * character whose code is given numerically) are unescaped * using HTML conventions. * An exception is that ampersands may be left unescaped * for convenience, when there is no following semicolon * in the string. * Null is returned for the null string and for the string "null". * An initial substring 'nullnull' is halved. 
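 * For example, under these conventions escape("non-stop") yields
 * "non&#45;stop" (the hyphen is character 45) and unescape("non&#45;stop")
 * restores "non-stop"; similarly, escape("nullify") yields "nullnullify",
 * which unescape maps back to "nullify".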
*/ public static String unescape(String s) { if (s == null || s.equals("null")) return null; StringBuffer output = null; // instantiate only if needed if (s.startsWith("nullnull")) { s = s.substring(4); output = new StringBuffer(); } for (int i=0; i < s.length(); i++) { char c = s.charAt(i); if (c == '&') { int endPos = s.indexOf(";", i); if (endPos < 0) { // allow unescaped ampersands if (output != null) output.append(c); continue; } if (output == null) { output = new StringBuffer(); output.append(s.substring(0,i)); } String escaped = s.substring(i+1, endPos); if (escaped.equals("lt")) { output.append('<'); i = endPos; continue; } if (escaped.equals("gt")) { output.append('>'); i = endPos; continue; } if (escaped.equals("amp")) { output.append('&'); i = endPos; continue; } if (escaped.equals("apos")) { output.append('\''); i = endPos; continue; } if (escaped.equals("quot")) { output.append('"'); i = endPos; continue; } if (s.charAt(i+1) == '#') { escaped = s.substring(i+2, endPos); output.append((char)Integer.parseInt(escaped)); i = endPos; continue; } throw new RuntimeException( "Unable to unescape " + s.substring(i,endPos+1) + "at position " + i + " in: " + s ); } else if (output != null) output.append(c); } return (output != null) ? output.toString() : s; } /** * Returns one or more orthographic words for the given word's form. * This method is called from within Sign.getWordsInXml as * part of producing the textual output of realization. * The default implementation checks the semantic class * for a special token class, and if true, returns the result * of expandDate, expandTime, expandNum, expandAmt, or * expandNamedEntity, as appropriate, after first checking that * the corresponding isDate, ..., isNamedEntity method returns true. * Otherwise, it splits the word form using underscore as a delimiter. */ public List expandWord(Word word) { String token = word.getForm(); String sc = word.getSemClass(); if (sc == Tokenizer.DATE_CLASS && isDate(token)) return expandDate(token); if (sc == Tokenizer.TIME_CLASS && isTime(token)) return expandTime(token); if (sc == Tokenizer.NUM_CLASS && isNum(token)) return expandNum(token); if (sc == Tokenizer.AMT_CLASS && isAmt(token)) return expandAmt(token); if (sc == Tokenizer.DUR_CLASS && isDur(token)) return expandDur(token); if (sc == Tokenizer.NE_CLASS && isNamedEntity(token)) return expandNamedEntity(token); String[] words = token.split("_"); return Arrays.asList(words); } /** * Returns one or more orthographic words for the given date token. * The default implementation expands the date with * EnglishExpander.expandDate, using the long option if the year is * present, and the medium option if not. */ public List expandDate(String date) { ArrayList retval = new ArrayList(); try { ParsePosition pos = new ParsePosition(0); Date dateObj = dateFormat.parse(date, pos); if (dateObj != null && pos.getIndex() == date.length()) { EnglishExpander.expandDate(dateObj, DateFormat.LONG, retval); } else { dateObj = dateFormatNoYear.parse(date); EnglishExpander.expandDate(dateObj, DateFormat.MEDIUM, retval); } } // shouldn't happen if isDate called first catch (ParseException exc) { // just add date string as a fall-back option retval.add(date); } return retval; } /** * Returns one or more orthographic words for the given time token. * The default implementation expands the time using * EnglishExpander.expandTime. 
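 * For example, given the default time format, expandTime("15:03")
 * produces the words "three", "oh", "three", "PM".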
*/ public List expandTime(String time) { ArrayList retval = new ArrayList(); try { EnglishExpander.expandTime(timeFormat.parse(time), retval); } // shouldn't happen if isTime called first catch (ParseException exc) { // just add time string as a fall-back option retval.add(time); } return retval; } /** * Returns one or more orthographic words for the given number token. * The default implementation expands the number using * EnglishExpander.expandNumber. */ public List expandNum(String num) { ArrayList retval = new ArrayList(); EnglishExpander.expandNumber(num, retval); return retval; } /** * Returns one or more orthographic words for the given amount token. * The default implementation expands the number using * EnglishExpander.expandAmount. */ public List expandAmt(String amt) { String code = amt.substring(amt.length()-3); String num = amt.substring(0,amt.length()-3).trim(); ArrayList retval = new ArrayList(); EnglishExpander.expandAmount(num, code, retval); return retval; } /** * Returns one or more orthographic words for the given duration token. * The default implementation expands the number using * EnglishExpander.expandDuration. */ public List expandDur(String dur) { Duration duration = null; try { duration = datatypeFactory.newDuration(dur); } catch (Exception exc) { // parsing not expected to fail throw (RuntimeException) new RuntimeException().initCause(exc); } ArrayList retval = new ArrayList(); EnglishExpander.expandDuration(duration, retval); return retval; } /** * Returns one or more orthographic words for the given named entity token. * The default implementation just splits the token using underscore as a delimiter. */ public List expandNamedEntity(String namedEntity) { String[] words = namedEntity.split("_"); return Arrays.asList(words); } /** Test: tokenize args[0], expand each token; and optionally do parseToken(args[1],true). */ public static void main(String[] args) { Tokenizer tk = new DefaultTokenizer(); String s = args[0]; List words = tk.tokenize(s); String expw = ""; System.out.println("words: "); for (int i = 0; i < words.size(); i++) { Word word = words.get(i); System.out.print(word + " "); List orthWords = tk.expandWord(word); for (int j = 0; j < orthWords.size(); j++) { expw += orthWords.get(j) + " "; } } System.out.println(); System.out.println("expanded: " + expw); System.out.println("formatted: " + tk.format(words)); if (args.length > 1) { System.out.println(); Word strictlyParsed = tk.parseToken(args[1], true); System.out.println("strictly parsed word: " + strictlyParsed); System.out.println("formatted: " + tk.format(strictlyParsed)); } } } ================================================ FILE: src/opennlp/ccg/lexicon/EnglishExpander.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004-5 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. 
// // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; import java.util.*; import java.text.*; import javax.xml.datatype.*; /** * EnglishExpander provides methods for expanding numbers, amounts, durations, * dates and times as English words. * The class com.sun.speech.freetts.en.us.NumberExpander served * as a reference point in part, but the implementation has been * rewritten from scratch, streamlined and extended. * * @author Michael White * @version $Revision: 1.7 $, $Date: 2005/10/20 17:30:30 $ **/ public class EnglishExpander { //-------------------------------------------- // dates // // formats date in month private static final DateFormat dateInMonthFormat = new SimpleDateFormat("dd", Locale.ENGLISH); // formats month in full private static final DateFormat monthFormat = new SimpleDateFormat("MMMM", Locale.ENGLISH); // formats year in full private static final DateFormat yearFormat = new SimpleDateFormat("yyyy", Locale.ENGLISH); /** * Expands a date to English words in short, * medium or long forms, adding the words to * the given list. The style is given by * DateFormat.SHORT (e.g., "the first"), * DateFormat.MEDIUM (e.g., "the first of May"), and * DateFormat.LONG (e.g., "the first of May, two thousand and four"). */ public static void expandDate(Date date, int style, List list) { list.add("the"); expandOrdinal(dateInMonthFormat.format(date), list); if (style == DateFormat.MEDIUM || style == DateFormat.LONG) { list.add("of"); list.add(monthFormat.format(date)); } if (style == DateFormat.LONG) { list.add(","); String year = yearFormat.format(date); // x00y if (year.charAt(1) == '0' && year.charAt(2) == '0') { expandNumber(year, list); } // xxyy else { expandNumber(year.substring(0,2), list); expandNumber(year.substring(2), list); } } } //-------------------------------------------- // times // // formats hours in range 1-12 private static final DateFormat hoursFormat = new SimpleDateFormat("hh", Locale.ENGLISH); // formats minutes private static final DateFormat minutesFormat = new SimpleDateFormat("mm", Locale.ENGLISH); // formats am/pm private static final DateFormat amPmFormat = new SimpleDateFormat("a", Locale.ENGLISH); /** * Expands a time to English words, * adding the words to the given list. * For example, a date object with time set to 23:02 * is expanded to "eleven oh two PM". */ public static void expandTime(Date time, List list) { // add hours String hours = hoursFormat.format(time); expandNDigitNumber(hours, list); // add minutes, with special case for 'oh' String minutes = minutesFormat.format(time); if (minutes.charAt(0) == '0' && minutes.charAt(1) != '0') { list.add("oh"); expandNDigitNumber(minutes.substring(1), list); } else { expandNDigitNumber(minutes, list); } // add AM or PM list.add(amPmFormat.format(time)); } //-------------------------------------------- // amounts // /** * Expands a digit string and currency code to * number words and the currency name, which * are added to the given list. * For example, "12.50" and "GBP" are expanded to * "twelve pounds and fifty pence". * The codes GBP, USD and EUR are converted to * names, while other codes are left as is. 
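 * Illustratively, "100" with the unnamed code "JPY" is expanded to
 * "one hundred JPY".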
*/ public static void expandAmount(String digitString, String currencyCode, List list) { // establish names for currency (singular and plural), // and fractional parts String currSing = null; String currPlur = null; String fracSing = null; String fracPlur = null; if (currencyCode.equals("GBP")) { currSing = "pound"; currPlur = "pounds"; fracSing = "penny"; fracPlur = "pence"; } else if (currencyCode.equals("USD")) { currSing = "dollar"; currPlur = "dollars"; fracSing = "cent"; fracPlur = "cents"; } else if (currencyCode.equals("EUR")) { currSing = "euro"; currPlur = "euros"; fracSing = "cent"; fracPlur = "cents"; } // if none, just expand digit string and append code if (currSing == null) { expandNumber(digitString, list); list.add(currencyCode); return; } // otherwise, get whole and fractional parts of digit string String whole = digitString; String frac = null; int dotIndex = digitString.indexOf("."); if (dotIndex != -1) { whole = digitString.substring(0,dotIndex); frac = digitString.substring(dotIndex+1); } // expand whole expandNumber(whole, list); // add currency name if (whole.equals("1")) list.add(currSing); else list.add(currPlur); // add fractional part, if any if (frac != null) { // add "and" list.add("and"); // expand frac expandNDigitNumber(frac, list); // add fractional name if (frac.equals("01")) list.add(fracSing); else list.add(fracPlur); } } //-------------------------------------------- // durations // /** * Expands a duration into a string of words. * NB: Fractions of seconds are ignored at present. */ public static void expandDuration(Duration duration, List list) { int[] durationFields = { duration.getYears(), duration.getMonths(), duration.getDays(), duration.getHours(), duration.getMinutes(), duration.getSeconds() }; int counter = 0; for (int i = 0; i < durationFields.length; i++) { if (durationFields[i] > 0) counter++; } for (int i = 0; i < durationFields.length; i++) { if (durationFields[i] > 0) { counter--; String str = Integer.toString(durationFields[i]); expandNumber(str, list); String unit = durUnits[i]; if (durationFields[i] != 1) unit += "s"; list.add(unit); if (counter > 1) list.add(","); if (counter == 1) list.add("and"); } } } // duration units private static String[] durUnits = { "year", "month", "day", "hour", "minute", "second" }; //-------------------------------------------- // numbers // /** * Expands a digit string to a sequence of digit words, * which are added to the given list. * For example, "1234" is expanded to "one two three four". */ public static void expandDigits(String digitString, List list) { for (int i = 0; i < digitString.length(); i++) { list.add(zeroToNine[digitString.charAt(i)-'0']); } } /** * Expands a digit string to number words, * which are added to the given list. * For example, "1234" is expanded to * "one thousand two hundred and thirty four". * The digit string may contain a single dot in it, * as well as an initial plus or minus character. * For example, "-100.011" is expanded to * "minus one hundred point zero one one". * Scientific notation is not currently handled. */ public static void expandNumber(String digitString, List list) { // do nothing with empty strings if (digitString.length() == 0) return; // handle plus or minus char c0 = digitString.charAt(0); if (c0 == '+' || c0 == '-') { list.add((c0 == '+') ? 
"plus" : "minus"); digitString = digitString.substring(1); } // check for dot int dotIndex = digitString.indexOf("."); if (dotIndex != -1) { // add numbers "point" digits expandNDigitNumber(digitString.substring(0,dotIndex), list); list.add("point"); expandDigits(digitString.substring(dotIndex+1), list); } else { // add numbers expandNDigitNumber(digitString, list); } } /** * Expands a digit string to words for an ordinal number, * which are added to the given list. * For example, "1234" is expanded to * "one thousand two hundred and thirty fourth". */ public static void expandOrdinal(String digitString, List list) { // expand number expandNDigitNumber(digitString, list); // replace last one int lastPos = list.size() - 1; String ordinal = getOrdinal(list.get(lastPos)); list.set(lastPos, ordinal); } // n-digit number public static void expandNDigitNumber(String digitString, List list) { int numDigits = digitString.length(); if (numDigits == 2) expand2DigitNumber(digitString, list); else if (numDigits == 3) expand3DigitNumber(digitString, list); else if (numDigits >= 4 && numDigits <= 12) expand4to12DigitNumber(digitString, list); else expandDigits(digitString, list); } // 2 digit numbers private static void expand2DigitNumber(String digitString, List list) { // 0x case if (digitString.charAt(0) == '0') { // do nothing for 00 case if (digitString.charAt(1) != '0') expandDigits(digitString.substring(1), list); } // 1x case else if (digitString.charAt(0) == '1') { list.add(tenToNineteen[digitString.charAt(1)-'0']); } // xy case, x >= 2 else { list.add(zeroToNinety[digitString.charAt(0)-'0']); // do nothing for x0 case if (digitString.charAt(1) != '0') expandDigits(digitString.substring(1), list); } } // 3 digit numbers private static void expand3DigitNumber(String digitString, List list) { // add hundreds if non-zero if (digitString.charAt(0) != '0') { // add hundreds digit expandDigits(digitString.substring(0,1), list); // add unit ("hundred") list.add("hundred"); } // add "and", if final two digits non-zero if (digitString.charAt(1) != '0' || digitString.charAt(2) != '0') list.add("and"); // expand final two digits expand2DigitNumber(digitString.substring(1), list); } // 4-12 digit numbers private static void expand4to12DigitNumber(String digitString, List list) { int numDigitsModThree = digitString.length() % 3; int numInitialDigits = (numDigitsModThree != 0) ? 
numDigitsModThree : 3; int unitsIndex = ((digitString.length() - 1) / 3) - 1; // add initial digits expandNDigitNumber(digitString.substring(0, numInitialDigits), list); // add unit list.add(thousandToBillion[unitsIndex]); // add rest expandNDigitNumber(digitString.substring(numInitialDigits), list); } //------------------------ // arrays of number words // private static final String[] zeroToNine = { "zero", "one", "two", "three", "four", "five", "six", "seven", "eight", "nine" }; private static final String[] tenToNineteen = { "ten", "eleven", "twelve", "thirteen", "fourteen", "fifteen", "sixteen", "seventeen", "eighteen", "nineteen" }; private static final String[] zeroToNinety = { "zero", "ten", "twenty", "thirty", "forty", "fifty", "sixty", "seventy", "eighty", "ninety" }; private static final String[] thousandToBillion = { "thousand", "million", "billion" }; private static final String[] zerothToNinth = { "zeroth", "first", "second", "third", "fourth", "fifth", "sixth", "seventh", "eighth", "ninth" }; private static final String[] tenthToNineteenth = { "tenth", "eleventh", "twelfth", "thirteenth", "fourteenth", "fifteenth", "sixteenth", "seventeenth", "eighteenth", "nineteenth" }; private static final String[] zerothToNinetieth = { "zeroth", "tenth", "twentieth", "thirtieth", "fortieth", "fiftieth", "sixtieth", "seventieth", "eightieth", "ninetieth" }; private static final String[] thousandthToBillionth = { "thousandth", "millionth", "billionth" }; //-------------------------------------------- // corresponding ordinals // // map from numbers to corresponding ordinals private static Map ordinalMap = null; // returns corresponding ordinal private static String getOrdinal(String number) { // ensure ordinalMap instantiated if (ordinalMap == null) { ordinalMap = new HashMap(); for (int i = 0; i < zeroToNine.length; i++) { ordinalMap.put(zeroToNine[i], zerothToNinth[i]); } for (int i = 0; i < tenToNineteen.length; i++) { ordinalMap.put(tenToNineteen[i], tenthToNineteenth[i]); } for (int i = 0; i < zeroToNinety.length; i++) { ordinalMap.put(zeroToNinety[i], zerothToNinetieth[i]); } ordinalMap.put("hundred", "hundredth"); for (int i = 0; i < thousandToBillion.length; i++) { ordinalMap.put(thousandToBillion[i], thousandthToBillionth[i]); } } return ordinalMap.get(number); } } ================================================ FILE: src/opennlp/ccg/lexicon/EntriesItem.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-9 Jason Baldridge, Gann Bierner and // University of Edinburgh / Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; import opennlp.ccg.synsem.*; import org.jdom.*; /** * Data structure for storing information about a category family entry. * * @author Jason Baldridge * @author Gann Bierner * @author Michael White * @version $Revision: 1.10 $, $Date: 2009/10/17 20:46:20 $ */ public class EntriesItem { private Family family; private Boolean active = Boolean.TRUE; private String name; private String stem; private String indexRel; private Category cat; public EntriesItem(Element el, Family family) { this.family = family; name = el.getAttributeValue("name"); stem = el.getAttributeValue("stem"); if (stem == null) stem = Lexicon.DEFAULT_VAL; String isActive = el.getAttributeValue("active"); if (isActive != null && isActive.equals("false")) active = Boolean.FALSE; String indexRelVal = el.getAttributeValue("indexRel"); if (indexRelVal != null) indexRel = indexRelVal; else indexRel = family.getIndexRel(); cat = CatReader.getCat((Element)el.getChildren().get(0)); } public Boolean getActive() { return active; } /** Returns the name of this entry. */ public String getName() { return name; } /** Returns the qualified name in the form familyName.name. */ public String getQualifiedName() { return getFamilyName() + "." + name; } /** Returns the name of this entry's family. */ public String getFamilyName() { return family.getName(); } /** Returns the supertag of this entry's category. */ public String getSupertag() { return cat.getSupertag(); } public Family getFamily() { return family; } public String getStem() { return stem; } public String getIndexRel() { return indexRel; } /** Returns this entry's family's coart rel. */ public String getCoartRel() { return family.getCoartRel(); } public Category getCat() { return cat; } public String toString () { return getQualifiedName() + ":" + stem + " :- " + cat; } } ================================================ FILE: src/opennlp/ccg/lexicon/FactorChainWord.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; import opennlp.ccg.util.*; import java.util.*; /** * A FactorChainWord represents a word via a chain of references to * factor keys, or just to a string in the case of the word form. * Canonical instances are created by a factory method, and stored * in a trie map. The factor chain representation should be more * space efficient when dealing with large numbers of words. 
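 * Illustratively, two words created with the same POS and supertag but
 * different forms share the initial chain nodes for their common factors
 * and diverge from the first differing factor onward, since the factory
 * below adds factors from the root in a rough specificity order (POS,
 * supertag, semantic class, stem, form, pitch accent, then any extra
 * attribute-value pairs).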
* * * @author Michael White * @version $Revision: 1.3 $, $Date: 2009/07/17 04:23:30 $ */ public class FactorChainWord extends Word { private static final long serialVersionUID = 952665894357382685L; /** The referenced factor key or string (for the word form). */ protected Object key; /** The previous node in the chain. */ protected FactorChainWord prev; /** Constructor. */ protected FactorChainWord(Object key, FactorChainWord prev) { this.key = key; this.prev = prev; } /** Returns the surface form. */ public String getForm() { return getValFromInterned(Tokenizer.WORD_ATTR); } /** Returns the pitch accent. */ public String getPitchAccent() { return getValFromInterned(Tokenizer.PITCH_ACCENT_ATTR); } /** Returns the list of extra attribute-value pairs. */ protected List> getAttrValPairsList() { List> retval = null; FactorChainWord current = this; while (current != null) { if (current.key instanceof FactorKey) { FactorKey fkey = (FactorKey) current.key; if (!isKnownAttr(fkey.factor)) { if (retval == null) retval = new ArrayList>(5); retval.add(0, new Pair(fkey.factor, fkey.val)); } } current = current.prev; } return retval; } /** Returns the stem. */ public String getStem() { return getValFromInterned(Tokenizer.STEM_ATTR); } /** Returns the part of speech. */ public String getPOS() { return getValFromInterned(Tokenizer.POS_ATTR); } /** Returns the supertag. */ public String getSupertag() { return getValFromInterned(Tokenizer.SUPERTAG_ATTR); } /** Returns the semantic class. */ public String getSemClass() { return getValFromInterned(Tokenizer.SEM_CLASS_ATTR); } /** Returns the value of the attribute with the given name, or null if none. The attribute names Tokenizer.WORD_ATTR, ..., Tokenizer.SEM_CLASS_ATTR may be used to retrieve the form, ..., semantic class. */ public String getVal(String attr) { String internedAttr = attr.intern(); // use == on interned attr return getValFromInterned(internedAttr); } /** Returns the value of the given interned attr, or null if none. */ protected String getValFromInterned(String attr) { FactorChainWord current = this; while (current != null) { if (attr == Tokenizer.WORD_ATTR) { if (current.key instanceof String) return (String) current.key; } else if (current.key instanceof FactorKey) { FactorKey fkey = (FactorKey) current.key; if (fkey.factor == attr) return fkey.val; } current = current.prev; } return null; } /** Factory. */ public static class Factory implements WordFactory { /** Trie map for canonical instances. */ protected TrieMap factorChainRoot = new TrieMap(null); /** Creates a surface word with the given interned form. */ public synchronized Word create(String form) { return create(factorChainRoot, Tokenizer.WORD_ATTR, form); } /** Creates a (surface or full) word with the given normalized attribute name and value. The attribute names Tokenizer.WORD_ATTR, ..., Tokenizer.SEM_CLASS_ATTR may be used for the form, ..., semantic class. */ public synchronized Word create(String attr, String val) { return create(factorChainRoot, attr, val); } /** Creates a (surface or full) word from the given normalized factors. Returns null if no non-null vals. 
*/ public synchronized Word create( String form, String pitchAccent, List> attrValPairs, String stem, String POS, String supertag, String semClass ) { // adds non-null vals from the root, in a rough specificity order TrieMap currentNode = factorChainRoot; if (POS != null) currentNode = findChild(currentNode, Tokenizer.POS_ATTR, POS); if (supertag != null) currentNode = findChild(currentNode, Tokenizer.SUPERTAG_ATTR, supertag); if (semClass != null) currentNode = findChild(currentNode, Tokenizer.SEM_CLASS_ATTR, semClass); if (stem != null) currentNode = findChild(currentNode, Tokenizer.STEM_ATTR, stem); if (form != null) currentNode = findChild(currentNode, Tokenizer.WORD_ATTR, form); if (pitchAccent != null) currentNode = findChild(currentNode, Tokenizer.PITCH_ACCENT_ATTR, pitchAccent); if (attrValPairs != null) { for (int i = 0; i < attrValPairs.size(); i++) { Pair p = attrValPairs.get(i); String attr = p.a; String val = p.b; currentNode = findChild(currentNode, attr, val); } } return currentNode.data; } /** Creates a word from the given node, adding the given interned attr and non-null val. */ protected Word create(TrieMap currentNode, String attr, String val) { TrieMap child = findChild(currentNode, attr, val); return child.data; } /** Gets or makes a child node from the given node. */ protected TrieMap findChild(TrieMap currentNode, String attr, String val) { Object key = FactorKey.getKey(attr, val); TrieMap child = currentNode.findChild(key); if (child.data == null) { FactorChainWord parent = currentNode.data; child.data = new FactorChainWord(key, parent); } return child; } } } ================================================ FILE: src/opennlp/ccg/lexicon/FactorKey.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; import opennlp.ccg.util.*; // import java.util.*; /** * Factor key, with identity equals for the factor and value. * * @author Michael White * @version $Revision: 1.1 $, $Date: 2005/03/22 20:59:32 $ */ public class FactorKey { /** The factor. */ public final String factor; /** The value. */ public final String val; /** Constructor. Assumes interned components. */ private FactorKey(String factor, String val) { this.factor = factor; this.val = val; } /** Makes/retrieves an interned factor key for the given interned attr and val; for the word form, the string itself is returned. Null vals are replaced with <NULL>. 
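 * For example, getKey(Tokenizer.WORD_ATTR, "ran") simply returns the
 * string "ran", whereas getKey(Tokenizer.POS_ATTR, "VBD") returns a
 * canonical FactorKey whose toString() is the value of Tokenizer.POS_ATTR
 * followed by "-VBD".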
*/ public static Object getKey(String attr, String val) { if (val == null) val = ""; if (attr == Tokenizer.WORD_ATTR) return val; else return Interner.globalIntern(new FactorKey(attr, val)); } /** Returns a hash code constructed from the component identity hash codes. */ public int hashCode() { return System.identityHashCode(factor) - System.identityHashCode(val); } /** Returns true if the given factor key has identical components. */ public boolean equals(Object obj) { if (this == obj) return true; if (!(obj instanceof FactorKey)) return false; FactorKey key = (FactorKey) obj; return factor == key.factor && val == key.val; } /** Returns "factor-val". */ public String toString() { return factor + "-" + val; } } ================================================ FILE: src/opennlp/ccg/lexicon/Family.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-9 Jason Baldridge, Gann Bierner and // University of Edinburgh / Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; import org.jdom.*; import java.util.*; /** * Lexicon category family. 
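 * A minimal sketch of the kind of XML element the constructor below
 * reads (the entry's category child and the member attributes are elided,
 * and the names shown are hypothetical):
 * <pre>
 * <family name="iv" pos="V" closed="false">
 *   <entry name="primary"> ... </entry>
 *   <member ... />
 * </family>
 * </pre>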
* * @author Jason Baldridge * @author Gann Bierner * @author Michael White * @version $Revision: 1.11 $, $Date: 2010/11/30 18:51:05 $ */ public class Family { private String name = ""; private Boolean closed = Boolean.FALSE; private String pos = ""; private String indexRel = ""; private String coartRel = ""; private DataItem[] data; private EntriesItem[] entries; @SuppressWarnings("unchecked") public Family(Element famel) { setName(famel.getAttributeValue("name")); pos = famel.getAttributeValue("pos"); String isClosed = famel.getAttributeValue("closed"); if (isClosed != null && isClosed.equals("true")) { setClosed(Boolean.TRUE); } String indexRelVal = famel.getAttributeValue("indexRel"); if (indexRelVal != null) { indexRel = indexRelVal; } String coartRelVal = famel.getAttributeValue("coartRel"); if (coartRelVal != null) { coartRel = coartRelVal; } List entriesList = famel.getChildren("entry"); entries = new EntriesItem[entriesList.size()]; for (int j=0; j < entriesList.size(); j++) { entries[j] = new EntriesItem(entriesList.get(j), this); } List members = famel.getChildren("member"); data = new DataItem[members.size()]; for (int j=0; j < members.size(); j++) { data[j] = new DataItem(members.get(j)); } } public Family(String s) { setName(s); } public boolean isClosed() { return closed.booleanValue(); } public void setName(String s) { name = s; } public void setClosed(Boolean b) { closed = b; } public void setPOS(String s) { pos = s; } public void setIndexRel(String s) { indexRel = s; } public void setCoartRel(String s) { coartRel = s; } public void setData(DataItem[] dm) { data = dm; } public void setEntries(EntriesItem[] em) { entries = em; } public String getName() { return name; } /** Delegates to first entry. */ public String getSupertag() { return entries[0].getSupertag(); } public Boolean getClosed() { return closed; } public String getPOS() { return pos; } public String getIndexRel() { return indexRel; } public String getCoartRel() { return coartRel; } public DataItem[] getData() { return data; } public EntriesItem[] getEntries() { return entries; } } ================================================ FILE: src/opennlp/ccg/lexicon/FullWord.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004-5 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; import opennlp.ccg.util.*; import java.util.*; /** * A FullWord object is a word with all possible fields. * The factory methods return interned objects. 
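 * Illustratively, since instances are interned, two factory calls with
 * identical factors return the same object, so words obtained from the
 * factory can be compared by reference.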
* * @author Michael White * @version $Revision: 1.6 $, $Date: 2009/07/17 04:23:30 $ */ public class FullWord extends WordWithPitchAccent { private static final long serialVersionUID = -3115687437782457735L; /** List of attribute-value pairs, which must be strings. */ protected List> attrValPairs; /** The stem. */ protected String stem; /** The part of speech. */ protected String POS; /** The supertag. */ protected String supertag; /** The semantic class (optional). */ protected String semClass; /** Returns the list of extra attribute-value pairs. */ protected List> getAttrValPairsList() { return attrValPairs; } /** Returns the stem. */ public String getStem() { return stem; } /** Returns the part of speech. */ public String getPOS() { return POS; } /** Returns the supertag. */ public String getSupertag() { return supertag; } /** Returns the semantic class (may be null). */ public String getSemClass() { return semClass; } /** Constructor for full word. */ protected FullWord( String form, String pitchAccent, List> attrValPairs, String stem, String POS, String supertag, String semClass ) { super(form, pitchAccent); this.attrValPairs = attrValPairs; this.stem = stem; this.POS = POS; this.supertag = supertag; this.semClass = semClass; } /** Factory. */ public static class Factory implements WordFactory { // reusable word, for looking up already interned ones private FullWord w = new FullWord(null, null, null, null, null, null, null); // sets the form and factors of the reusable word w private void setW( String form, String pitchAccent, List> attrValPairs, String stem, String POS, String supertag, String semClass ) { w.form = form; w.pitchAccent = pitchAccent; w.attrValPairs = attrValPairs; w.stem = stem; w.POS = POS; w.supertag = supertag; w.semClass = semClass; } // looks up the word equivalent to w, or if none, returns a new one based on it private Word getOrCreateFromW() { Word retval = (Word) Interner.getGlobalInterned(w); if (retval != null) return retval; if (w.isSurfaceWord() && w.attrValPairs == null) { if (w.pitchAccent == null) retval = new SimpleWord(w.form); else retval = new WordWithPitchAccent(w.form, w.pitchAccent); } else retval = new FullWord(w.form, w.pitchAccent, w.attrValPairs, w.stem, w.POS, w.supertag, w.semClass); return (Word) Interner.globalIntern(retval); } /** Creates a surface word with the given interned form. */ public synchronized Word create(String form) { return create(form, null, null, null, null, null, null); } /** Creates a (surface or full) word with the given normalized attribute name and value. The attribute names Tokenizer.WORD_ATTR, ..., Tokenizer.SEM_CLASS_ATTR may be used for the form, ..., semantic class. */ public synchronized Word create(String attr, String val) { String form = null; String pitchAccent = null; List> attrValPairs = null; String stem = null; String POS = null; String supertag = null; String semClass = null; if (attr == Tokenizer.WORD_ATTR) form = val; else if (attr == Tokenizer.PITCH_ACCENT_ATTR) pitchAccent = val; else if (attr == Tokenizer.STEM_ATTR) stem = val; else if (attr == Tokenizer.POS_ATTR) POS = val; else if (attr == Tokenizer.SUPERTAG_ATTR) supertag = val; else if (attr == Tokenizer.SEM_CLASS_ATTR) semClass = val; else { attrValPairs = new ArrayList>(1); attrValPairs.add(new Pair(attr, val)); } return create(form, pitchAccent, attrValPairs, stem, POS, supertag, semClass); } /** Creates a (surface or full) word from the given canonical factors. 
*/ public synchronized Word create( String form, String pitchAccent, List> attrValPairs, String stem, String POS, String supertag, String semClass ) { setW(form, pitchAccent, attrValPairs, stem, POS, supertag, semClass); return getOrCreateFromW(); } } } ================================================ FILE: src/opennlp/ccg/lexicon/LexException.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-3 Jason Baldridge, Gann Bierner and // University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; /** * Any exception thrown if something wrong happens in the lexicon. * * @author Gann Bierner * @author Michael White * @version $Revision: 1.3 $, $Date: 2005/10/20 17:30:30 $ */ public class LexException extends Exception { private static final long serialVersionUID = 1L; /** The message. */ protected String msg; /** * Constructor with message. */ public LexException(String s) { msg = s; } /** Returns exception message. */ public String toString() { return "Lexicon Exception: " + msg; } } ================================================ FILE: src/opennlp/ccg/lexicon/Lexicon.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004-9 Jason Baldridge, Gann Bierner and // Michael White (University of Edinburgh, The Ohio State University) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; import opennlp.ccg.grammar.*; import opennlp.ccg.synsem.*; import opennlp.ccg.unify.*; import opennlp.ccg.util.*; import opennlp.ccg.hylo.*; import org.jdom.*; import java.io.*; import java.net.*; import java.util.*; import gnu.trove.*; /** * Contains words and their associated categories and semantics. * Lookup can be filtered by plugging in a supertagger. 
* * * @author Gann Bierner * @author Jason Baldridge * @author Michael White * @version $Revision: 1.78 $, $Date: 2011/10/31 02:01:06 $ */ public class Lexicon { /** Flag used to indicate a purely syntactic edge, with no associated semantics. */ public static final String NO_SEM_FLAG = "*NoSem*"; /** Constant used to signal the substitution of the stem or pred. */ public static final String DEFAULT_VAL = "[*DEFAULT*]"; // supertagger private SupertaggerAdapter _supertagger = null; // various maps private GroupMap _words; private GroupMap _stems; private GroupMap _macros; private HashMap _macroItems; private GroupMap _posToEntries; private GroupMap _stagToEntries; private GroupMap _predToWords; private GroupMap _relsToPreds; private GroupMap _coartRelsToPreds; // coarticulation attrs private Set _coartAttrs; private Set _indexedCoartAttrs; // attrs per atomic category type, across all entries private GroupMap _catsToAttrs; private Set _lfAttrs; // distributive attributes private String[] _distributiveAttrs = null; // licensing features private LicensingFeature[] _licensingFeatures = null; // relation sorting private HashMap _relationIndexMap = new HashMap(); // interner for caching lex lookups during realization private Interner lookupCache = new Interner(true); /** The grammar that this lexicon is part of. */ public final Grammar grammar; /** The tokenizer. (Defaults to DefaultTokenizer.) */ public final Tokenizer tokenizer; /** Flag for whether the lexicon is open, ie complete lexical category mappings are not expected. (Defaults to false.) */ public boolean openlex = false; /** Flag for whether to show warnings for failed sem class unification. (Defaults to false.) */ public boolean debugSemClasses = false; /************************************************************* * Constructor *************************************************************/ public Lexicon(Grammar grammar) { this.grammar = grammar; this.tokenizer = new DefaultTokenizer(); } /** Constructor with tokenizer. */ public Lexicon(Grammar grammar, Tokenizer tokenizer) { this.grammar = grammar; this.tokenizer = tokenizer; } //------------------------------------------------------------- /** Sets the supertagger (null if none). */ public void setSupertagger(SupertaggerAdapter supertagger) { _supertagger = supertagger; } /** Loads the lexicon and morph files. 
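 * A minimal usage sketch (the file names and the grammar variable here
 * are hypothetical; in practice the URLs normally come from the grammar
 * definition):
 * <pre>
 * Lexicon lexicon = new Lexicon(grammar);
 * lexicon.init(new File("lexicon.xml").toURI().toURL(),
 *              new File("morph.xml").toURI().toURL());
 * </pre>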
*/ public void init(URL lexiconUrl, URL morphUrl) throws IOException { List lexicon = null; List morph = null; List macroModel = null; // load category families (lexicon), morph forms and macros lexicon = getLexicon(lexiconUrl); Pair,List> morphInfo = getMorph(morphUrl); morph = morphInfo.a; macroModel = morphInfo.b; // index words; also index stems to words, as default preds // store indexed coarticulation attrs too _words = new GroupMap(); _predToWords = new GroupMap(); _coartAttrs = new HashSet(); _indexedCoartAttrs = new HashSet(); for (MorphItem morphItem : morph) { Word surfaceWord = morphItem.getSurfaceWord(); _words.put(surfaceWord, morphItem); _predToWords.put(morphItem.getWord().getStem(), surfaceWord); if (morphItem.isCoart()) { Word indexingWord = morphItem.getCoartIndexingWord(); _words.put(indexingWord, morphItem); Pair first = indexingWord.getSurfaceAttrValPairs().next(); _indexedCoartAttrs.add(first.a); for (Iterator> it = surfaceWord.getSurfaceAttrValPairs(); it.hasNext(); ) { Pair p = it.next(); _coartAttrs.add(p.a); } } } // index entries based on stem+pos _stems = new GroupMap(); _posToEntries = new GroupMap(); // index entries by supertag+pos, for supertagging _stagToEntries = new GroupMap(); // also index rels and coart rels to preds _relsToPreds = new GroupMap(); _coartRelsToPreds = new GroupMap(); // and gather list of attributes used per atomic category type _catsToAttrs = new GroupMap(); _lfAttrs = new HashSet(); // and remember family and ent, names, for checking excluded list on morph items HashSet familyAndEntryNames = new HashSet(); // index each family for (Family family : lexicon) { familyAndEntryNames.add(family.getName()); EntriesItem[] entries = family.getEntries(); DataItem[] data = family.getData(); // for generic use when we get an unknown stem // from the morphological analyzer if (!family.isClosed()) { _posToEntries.put(family.getPOS(), entries); } // scan through entries for (int j=0; j < entries.length; j++) { // index EntriesItem eItem = entries[j]; _stagToEntries.put(eItem.getSupertag()+family.getPOS(), eItem); if (eItem.getStem().length() > 0) { _stems.put(eItem.getStem()+family.getPOS(), eItem); } try { // gather features eItem.getCat().forall(gatherAttrs); // record names familyAndEntryNames.add(eItem.getName()); familyAndEntryNames.add(eItem.getQualifiedName()); } catch (RuntimeException exc) { System.err.println("exception for: " + family.getName() + ": " + exc); } } // scan through data for (int j=0; j < data.length; j++) { DataItem dItem = data[j]; _stems.put(dItem.getStem()+family.getPOS(), new Pair(dItem,entries)); // index non-default preds to words if (!dItem.getStem().equals(dItem.getPred())) { Collection words = (Collection) _predToWords.get(dItem.getStem()); if (words == null) { if (!openlex) { System.out.print("Warning: couldn't find words for pred '"); System.out.println(dItem.getPred() + "' with stem '" + dItem.getStem() + "'"); } } else { for (Iterator it = words.iterator(); it.hasNext(); ) { _predToWords.put(dItem.getPred(), it.next()); } } } } // index rels to preds // nb: this covers relational (eg @xe) and featural (eg @epast) // elementary predications List indexRels = new ArrayList(3); String familyIndexRel = family.getIndexRel(); if (familyIndexRel.length() > 0) { indexRels.add(familyIndexRel); } for (int j=0; j < entries.length; j++) { EntriesItem eItem = entries[j]; String indexRel = eItem.getIndexRel(); if (indexRel.length() > 0 && !indexRel.equals(familyIndexRel)) { indexRels.add(indexRel); } } for (Iterator it = 
indexRels.iterator(); it.hasNext(); ) { String indexRel = it.next(); // nb: not indexing on entries items, b/c some stems are still defaults for (int j=0; j < data.length; j++) { DataItem dItem = data[j]; _relsToPreds.put(indexRel, dItem.getPred()); } } // index coart rels (features, really) to preds String coartRel = family.getCoartRel(); if (coartRel.length() > 0) { for (int j=0; j < data.length; j++) { _coartRelsToPreds.put(coartRel, data[j].getPred()); } } } // index the macros _macros = new GroupMap(); // nb: could just index MacroItem objects for feature structures too; // this might be a bit cleaner, but life is short _macroItems = new HashMap(); for (MacroItem mi : macroModel) { String macName = mi.getName(); FeatureStructure[] specs = mi.getFeatureStructures(); for (int j=0; j < specs.length; j++) { _macros.put(macName, specs[j]); } // this is for handling LF part of macros _macroItems.put(macName, mi); } // with morph items, check POS, macro names, excluded list for xref for (MorphItem morphItem : morph) { Word w = morphItem.getWord(); if (!openlex && !_stems.containsKey(w.getStem() + w.getPOS()) && !_posToEntries.containsKey(w.getPOS())) { System.err.println( "Warning: no entries for stem '" + w.getStem() + "' and POS '" + w.getPOS() + "' found for word '" + w + "'" ); } String[] macroNames = morphItem.getMacros(); for (int j=0; j < macroNames.length; j++) { if (!_macroItems.containsKey(macroNames[j])) { System.err.println("Warning: macro " + macroNames[j] + " not found for word '" + morphItem.getWord() + "'"); } } String[] excludedNames = morphItem.getExcluded(); for (int j=0; j < excludedNames.length; j++) { if (!familyAndEntryNames.contains(excludedNames[j])) { System.err.println("Warning: excluded family or entry '" + excludedNames[j] + "' not found for word '" + morphItem.getWord() + "'"); } } } } /** Expands inheritsFrom links to feature equations for those features not explicitly listed. */ public void expandInheritsFrom(Category cat) { expandInheritsFrom(cat, null); } /** Expands inheritsFrom links to feature equations for those features not explicitly listed. 
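 * For example, if an atomic category's feature structure declares an
 * inheritsFrom index pointing at another feature structure with a "num"
 * feature, the "num" value is copied over; any further attribute that is
 * used with that category type but present in neither structure is filled
 * in with a fresh variable shared by both structures, so that they are
 * forced to agree under unification.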
*/ public void expandInheritsFrom(Category cat, Category cat2) { // index feature structures featStrucMap.clear(); cat.forall(indexFeatStrucs); if (cat2 != null) { cat2.forall(indexFeatStrucs); } // add feature eqs cat.forall(doInheritsFrom); if (cat2 != null) { cat2.forall(doInheritsFrom); } } // gathers attrs from a category private CategoryFcn gatherAttrs = new CategoryFcnAdapter() { public void forall(Category c) { if (!(c instanceof AtomCat)) return; String type = ((AtomCat)c).getType(); FeatureStructure fs = c.getFeatureStructure(); if (fs == null) return; for (Iterator it = fs.getAttributes().iterator(); it.hasNext(); ) { String att = it.next(); _catsToAttrs.put(type, att); if (fs.getValue(att) instanceof LF) { _lfAttrs.add(att); } } } }; // a map from indices to atomic categories, reset for each category private TIntObjectHashMap featStrucMap = new TIntObjectHashMap(); // fills in featStrucMap for a category private CategoryFcn indexFeatStrucs = new CategoryFcnAdapter() { public void forall(Category c) { FeatureStructure fs = c.getFeatureStructure(); if (fs != null && fs.getIndex() != 0) featStrucMap.put(fs.getIndex(), fs); } }; // adds feature equations to percolate attributes from inheritsFrom feature // structure, except for any attributes already present private CategoryFcn doInheritsFrom = new CategoryFcnAdapter() { public void forall(Category c) { // get feature structures if (!(c instanceof AtomCat)) return; String type = ((AtomCat)c).getType(); FeatureStructure fs = c.getFeatureStructure(); GFeatStruc gfs = (GFeatStruc) fs; if (gfs == null || gfs.getInheritsFrom() == 0) return; int inhf = gfs.getInheritsFrom(); FeatureStructure inhfFS = (FeatureStructure) featStrucMap.get(inhf); if (inhfFS != null) { // copy values of features from inhfFS not already present for (Iterator it = inhfFS.getAttributes().iterator(); it.hasNext(); ) { String att = it.next(); if (gfs.hasAttribute(att)) continue; gfs.setFeature(att, UnifyControl.copy(inhfFS.getValue(att))); } // for each possible attr used with this type and not already present, // add feature equation Collection attrs = (Collection) _catsToAttrs.get(type); if (attrs == null) return; for (Iterator it = attrs.iterator(); it.hasNext(); ) { String att = it.next(); if (gfs.hasAttribute(att)) continue; String varName = att.toUpperCase() + inhf; if (_lfAttrs.contains(att)) { gfs.setFeature(att, new HyloVar(varName)); inhfFS.setFeature(att, new HyloVar(varName)); } else { gfs.setFeature(att, new GFeatVar(varName)); inhfFS.setFeature(att, new GFeatVar(varName)); } } } else { System.err.println( "Warning: no feature structure with inheritsFrom index of " + inhf + " found in category " + c ); } } }; /** * Returns the lexical signs indexed by the given rel, or null if none. 
*/ public Collection getSignsFromRel(String rel) { // check cache (if not doing supertagging) if (_supertagger == null) { RelLookup lookup = new RelLookup(rel); RelLookup retLookup = (RelLookup) lookupCache.getInterned(lookup); if (retLookup != null) return retLookup.signs; } // lookup signs via preds Collection preds = (Collection) _relsToPreds.get(rel); if (preds == null) return null; Collection retval = getSignsFromRelAndPreds(rel, preds); // cache non-null result (if not doing supertagging) if (_supertagger == null && retval != null) { RelLookup lookup = new RelLookup(rel); lookup.signs = retval; lookupCache.intern(lookup); } return retval; } // get signs for rel via preds, or null if none private Collection getSignsFromRelAndPreds(String rel, Collection preds) { List retval = new ArrayList(); for (Iterator it = preds.iterator(); it.hasNext(); ) { String pred = it.next(); Collection signs = getSignsFromPredAndTargetRel(pred, rel); if (signs != null) retval.addAll(signs); } // return null if none survive filter if (retval.size() > 0) return retval; else return null; } /** * Returns the lexical signs indexed by the given pred. * If the pred is not listed in the lexicon, the tokenizer is * consulted to see if it is a special token (date, time, etc.); * otherwise, null is returned. * Coarticulations are applied for the given rels, if non-null. */ public Collection getSignsFromPred(String pred, List coartRels) { // check cache (if not doing supertagging) if (_supertagger == null) { PredLookup lookup = new PredLookup(pred, coartRels); PredLookup retLookup = (PredLookup) lookupCache.getInterned(lookup); if (retLookup != null) return retLookup.signs; } // lookup pred Collection result = getSignsFromPredAndTargetRel(pred, null); if (result == null) return null; // apply coarts for rels if (coartRels != null) applyCoarts(coartRels, result); // cache result (if not doing supertagging) if (_supertagger == null) { PredLookup lookup = new PredLookup(pred, coartRels); lookup.signs = result; lookupCache.intern(lookup); } // and return return result; } // get signs using an additional arg for a target rel private Collection getSignsFromPredAndTargetRel(String pred, String targetRel) { Collection words = (Collection) _predToWords.get(pred); String specialTokenConst = null; // for robustness, when using supertagger, add words for pred sans sense index int dotIndex = -1; if (_supertagger != null && !Character.isDigit(pred.charAt(0)) && // skip numbers (dotIndex = pred.lastIndexOf('.')) > 0 && pred.length() > dotIndex+1 && pred.charAt(dotIndex+1) != '_') // skip titles, eg Mr._Smith { String barePred = pred.substring(0, dotIndex); Collection barePredWords = (Collection) _predToWords.get(barePred); if (words == null) words = barePredWords; else if (barePredWords != null) { Set unionWords = new HashSet(words); unionWords.addAll(barePredWords); words = unionWords; } } if (words == null) { specialTokenConst = tokenizer.getSpecialTokenConstant(tokenizer.isSpecialToken(pred)); if (specialTokenConst == null) return null; // lookup words with pred = special token const Collection specialTokenWords = (Collection) _predToWords.get(specialTokenConst); // replace special token const with pred if (specialTokenWords == null) return null; words = new ArrayList(specialTokenWords.size()); for (Iterator it = specialTokenWords.iterator(); it.hasNext(); ) { Word stw = it.next(); Word w = Word.createSurfaceWord(stw, pred); words.add(w); } } List retval = new ArrayList(); for (Iterator it = words.iterator(); it.hasNext(); ) { 
Word w = it.next(); try { SignHash signs = getSignsFromWord(w, specialTokenConst, pred, targetRel); retval.addAll(signs.asSignSet()); } // shouldn't happen catch (LexException exc) { System.err.println("Unexpected lex exception for word " + w + ": " + exc); } } return retval; } // look up and apply coarts for given rels to each sign in result private void applyCoarts(List coartRels, Collection result) { List inputSigns = new ArrayList(result); result.clear(); List outputSigns = new ArrayList(inputSigns.size()); // for each rel, lookup coarts and apply to input signs, storing results in output signs for (Iterator it = coartRels.iterator(); it.hasNext(); ) { String rel = it.next(); Collection preds = (Collection) _coartRelsToPreds.get(rel); if (preds == null) continue; // not expected Collection coartResult = getSignsFromRelAndPreds(rel, preds); if (coartResult == null) continue; for (Iterator it2 = coartResult.iterator(); it2.hasNext(); ) { Sign coartSign = it2.next(); // apply to each input for (int j = 0; j < inputSigns.size(); j++) { Sign sign = inputSigns.get(j); grammar.rules.applyCoart(sign, coartSign, outputSigns); } } // switch output to input for next iteration inputSigns.clear(); inputSigns.addAll(outputSigns); outputSigns.clear(); } // add results back result.addAll(inputSigns); } /** * For a string of 1 or more surface words, return all of the lexical * entries for each word as a list of sign hashes. * Tokenization is performed using the configured tokenizer. * * @param w the words in string format * @return a list of sign hashes * @exception LexException thrown if word not found */ public List getEntriesFromWords(String s) throws LexException { List entries = new ArrayList(); List words = tokenizer.tokenize(s); for (Iterator it = words.iterator(); it.hasNext(); ) { Word w = it.next(); SignHash signs = getSignsFromWord(w); if (signs.size() == 0) { throw new LexException("Word not in lexicon: \"" + w +"\""); } entries.add(signs); } return entries; } /** * For a given word, return all of its surface word's lexical entries. * If the word is not listed in the lexicon, the tokenizer is * consulted to see if it is a special token (date, time, etc.); * otherwise an exception is thrown. * If the word has coarticulations, all applicable coarticulation * entries are applied to the base word, in an arbitrary order. * * @param w the word * @return a sign hash * @exception LexException thrown if word not found */ public SignHash getSignsFromWord(Word w) throws LexException { // reduce word to its core, removing coart attrs if any Word surfaceWord = Word.createSurfaceWord(w); Word coreWord = (surfaceWord.attrsIntersect(_coartAttrs)) ? 
Word.createCoreSurfaceWord(surfaceWord, _coartAttrs) : surfaceWord; // lookup core word SignHash result = getSignsFromWord(coreWord, null, null, null); if (result.size() == 0) { throw new LexException(coreWord + " not found in lexicon"); } // return signs if no coart attrs if (coreWord == surfaceWord) return result; // otherwise apply coarts for word applyCoarts(surfaceWord, result); return result; } // look up and apply coarts for w to each sign in result @SuppressWarnings("unchecked") private void applyCoarts(Word w, SignHash result) throws LexException { List inputSigns = new ArrayList(result.asSignSet()); result.clear(); List outputSigns = new ArrayList(inputSigns.size()); // for each surface attr, lookup coarts and apply to input signs, storing results in output signs for (Iterator> it = w.getSurfaceAttrValPairs(); it.hasNext(); ) { Pair p = it.next(); String attr = (String) p.a; if (!_indexedCoartAttrs.contains(attr)) continue; String val = (String) p.b; Word coartWord = Word.createWord(attr, val); SignHash coartResult = getSignsFromWord(coartWord, null, null, null); for (Iterator it2 = coartResult.iterator(); it2.hasNext(); ) { Sign coartSign = it2.next(); // apply to each input for (int j = 0; j < inputSigns.size(); j++) { Sign sign = inputSigns.get(j); grammar.rules.applyCoart(sign, coartSign, outputSigns); } } // switch output to input for next iteration inputSigns.clear(); inputSigns.addAll(outputSigns); outputSigns.clear(); } // add results back result.addAll(inputSigns); } // get signs with additional args for a known special token const, target pred and target rel private SignHash getSignsFromWord(Word w, String specialTokenConst, String targetPred, String targetRel) throws LexException { Collection morphItems = (specialTokenConst == null) ? 
(Collection) _words.get(w) : null; if (morphItems == null) { // check for special tokens if (specialTokenConst == null) { specialTokenConst = tokenizer.getSpecialTokenConstant(tokenizer.isSpecialToken(w.getForm())); targetPred = w.getForm(); } if (specialTokenConst != null) { Word key = Word.createSurfaceWord(w, specialTokenConst); morphItems = (Collection) _words.get(key); } // otherwise throw lex exception if (morphItems == null) throw new LexException(w + " not in lexicon"); } SignHash result = new SignHash(); for (Iterator MI = morphItems.iterator(); MI.hasNext();) { getWithMorphItem(w, MI.next(), targetPred, targetRel, result); } return result; } // given MorphItem private void getWithMorphItem(Word w, MorphItem mi, String targetPred, String targetRel, SignHash result) throws LexException { // get supertags for filtering, if a supertagger is installed Map supertags = null; Set supertagsFound = null; if (_supertagger != null) { supertags = _supertagger.getSupertags(); if (supertags != null) supertagsFound = new HashSet(supertags.size()); } // get macro adder MacroAdder macAdder = getMacAdder(mi); // if we have this stem in our lexicon String stem = mi.getWord().getStem(); String pos = mi.getWord().getPOS(); Set explicitEntries = null; // for storing entries from explicitly listed family members if (_stems.containsKey(stem+pos)) { explicitEntries = new HashSet(); Collection stemItems = (Collection)_stems.get(stem+pos); for (Iterator I=stemItems.iterator(); I.hasNext();) { Object item = I.next(); // see if it's an EntriesItem if (item instanceof EntriesItem) { EntriesItem entry = (EntriesItem) item; // do lookup getWithEntriesItem(w, mi, stem, stem, targetPred, targetRel, entry, macAdder, supertags, supertagsFound, result); } // otherwise it has to be a Pair containing a DataItem and // an EntriesItem[] else { @SuppressWarnings("rawtypes") DataItem dItem = (DataItem)((Pair)item).a; @SuppressWarnings("rawtypes") EntriesItem[] entries = (EntriesItem[])((Pair)item).b; // store entries explicitEntries.add(entries); // do lookup getWithDataItem(w, mi, dItem, entries, targetPred, targetRel, macAdder, supertags, supertagsFound, result); } } } // for entries that are not explicitly in the lexicon file, we have to create // Signs from the open class entries with the appropriate part-of-speech Collection entrySets = (Collection)_posToEntries.get(pos); if (entrySets != null) { for (Iterator E=entrySets.iterator(); E.hasNext(); ) { EntriesItem[] entries = E.next(); // skip if entries explicitly listed if (explicitEntries != null && explicitEntries.contains(entries)) continue; // otherwise get entries with pred = targetPred, or stem if null String pred = (targetPred != null) ? targetPred : stem; getWithDataItem(w, mi, new DataItem(stem, pred), entries, targetPred, targetRel, macAdder, supertags, supertagsFound, result); } } // finally do entries for any remaining supertags if (supertags != null) { for (String supertag : supertags.keySet()) { if (supertagsFound.contains(supertag)) continue; Set entries = _stagToEntries.get(supertag+pos); if (entries == null) continue; // nb: could be a POS mismatch // get entries with pred = targetPred, or stem if null String pred = (targetPred != null) ? 
targetPred : stem; for (EntriesItem entry : entries) { if (!entry.getStem().equals(DEFAULT_VAL)) continue; getWithEntriesItem(w, mi, stem, pred, targetPred, targetRel, entry, macAdder, supertags, supertagsFound, result); } } } } // given DataItem private void getWithDataItem(Word w, MorphItem mi, DataItem item, EntriesItem[] entries, String targetPred, String targetRel, MacroAdder macAdder, Map supertags, Set supertagsFound, SignHash result) { for (int i=0; i < entries.length; i++) { EntriesItem entry = entries[i]; if (entry.getStem().equals(DEFAULT_VAL)) { getWithEntriesItem(w, mi, item.getStem(), item.getPred(), targetPred, targetRel, entry, macAdder, supertags, supertagsFound, result); } } } // given EntriesItem private void getWithEntriesItem(Word w, MorphItem mi, String stem, String pred, String targetPred, String targetRel, EntriesItem item, MacroAdder macAdder, Map supertags, Set supertagsFound, SignHash result) { // ensure apropos if (targetPred != null && !targetPred.equals(pred)) return; if (targetRel != null && !targetRel.equals(item.getIndexRel()) && !targetRel.equals(item.getCoartRel())) return; if (!item.getActive().booleanValue()) return; if (mi.excluded(item)) return; try { // copy and add macros Category cat = item.getCat().copy(); macAdder.addMacros(cat); // replace DEFAULT_VAL with pred, after first // unifying type of associated nom var(s) with sem class unifySemClass(cat, mi.getWord().getSemClass()); REPLACEMENT = pred; cat.deepMap(defaultReplacer); // check supertag // TODO: think about earlier checks for efficiency, for grammars where macros and preds don't matter //Double lexprob = null; // nb: skipping lex log probs, don't seem to be helpful if (supertags != null) { // skip if not found String stag = cat.getSupertag(); if (!supertags.containsKey(stag)) return; // otherwise update found supertags supertagsFound.add(stag); // get lex prob //lexprob = supertags.get(stag); } // propagate types of nom vars propagateTypes(cat); // handle distrib attrs and inherits-from propagateDistributiveAttrs(cat); expandInheritsFrom(cat); // merge stem, pos, sem class from morph item, plus supertag from cat Word word = Word.createFullWord(w, mi.getWord(), cat.getSupertag()); // set origin and lexprob Sign sign = new Sign(word, cat); sign.setOrigin(); //if (lexprob != null) { // sign.addData(new SupertaggerAdapter.LexLogProb((float) Math.log10(lexprob))); //} // return sign result.insert(sign); } catch (RuntimeException exc) { System.err.println( "Warning: ignoring entry: " + item.getName() + " of family: " + item.getFamilyName() + " for stem: " + stem + " b/c: " + exc.toString() ); } } // the sem class for defaultNomvarSetter private SimpleType SEMCLASS = null; // unify sem class with default nom var(s) private void unifySemClass(Category cat, String semClass) { if (semClass == null || cat.getLF() == null) return; SEMCLASS = grammar.types.getSimpleType(semClass); try { cat.getLF().deepMap(defaultNomvarUnifier); } catch (TypePropagationException tpe) { if (debugSemClasses) { System.err.println( "Warning: unable to unify types '" + tpe.st1 + "' and '" + tpe.st2 + "' in unifying sem class in cat: \n" + cat ); } } } // mod function to unify type of nom var for DEFAULT_VAL with SEMCLASS private ModFcn defaultNomvarUnifier = new ModFcn() { public void modify(Mutable m) { if (!(m instanceof SatOp)) return; SatOp satop = (SatOp) m; if (!(satop.getArg() instanceof Proposition)) return; Proposition prop = (Proposition) satop.getArg(); if (!prop.getName().equals(DEFAULT_VAL)) return; if 
(!(satop.getNominal() instanceof NominalVar)) return; NominalVar nv = (NominalVar) satop.getNominal(); SimpleType st = nv.getType(); // check equality if (st.equals(SEMCLASS)) return; // otherwise unify types, update nv try { SimpleType stU = (SimpleType) st.unify(SEMCLASS, null); nv.setType(stU); } catch (UnifyFailure uf) { throw new TypePropagationException(st, SEMCLASS); } } }; // the replacement string for defaultReplacer private String REPLACEMENT = ""; // mod function to replace DEFAULT_VAL with REPLACEMENT private ModFcn defaultReplacer = new ModFcn() { public void modify(Mutable m) { if (m instanceof Proposition) { Proposition prop = (Proposition) m; if (prop.getName().equals(DEFAULT_VAL)) prop.setAtomName(REPLACEMENT); } else if (m instanceof FeatureStructure) { FeatureStructure fs = (FeatureStructure) m; for (Iterator it = fs.getAttributes().iterator(); it.hasNext(); ) { String attr = it.next(); Object val = fs.getValue(attr); if (val instanceof SimpleType && ((SimpleType)val).getName().equals(DEFAULT_VAL)) { fs.setFeature(attr, grammar.types.getSimpleType(REPLACEMENT)); } } } } }; // a cache for macro adders private Map macAdderMap = new HashMap(); // returns a macro adder for the given morph item private MacroAdder getMacAdder(MorphItem mi) { // check map MacroAdder retval = macAdderMap.get(mi); if (retval != null) return retval; // set up macro adder IntHashSetMap macrosFromLex = new IntHashSetMap(); String[] newMacroNames = mi.getMacros(); List macroItems = new ArrayList(); for (int i=0; i < newMacroNames.length; i++) { Set featStrucs = (Set)_macros.get(newMacroNames[i]); if (featStrucs != null) { for (Iterator fsIt = featStrucs.iterator(); fsIt.hasNext();) { FeatureStructure fs = fsIt.next(); macrosFromLex.put(fs.getIndex(), fs); } } MacroItem macroItem = _macroItems.get(newMacroNames[i]); if (macroItem != null) { macroItems.add(macroItem); } else { // should be checked earlier too System.err.println("Warning: macro " + newMacroNames[i] + " not found for word '" + mi.getWord() + "'"); } } retval = new MacroAdder(macrosFromLex, macroItems); // update map and return macAdderMap.put(mi, retval); return retval; } // // type propagation // /** Propagates types of nomvars in the given category. */ public void propagateTypes(Category cat) { propagateTypes(cat, null); } /** Propagates types of nomvars in the given categories. 
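* <p>Nominal variables are keyed by name, so if the same variable occurs with
* different types within the category (or across the two categories), the types
* are unified and every occurrence is updated to the unified type; unification
* failures are only reported when sem class debugging is on. Sketch
* (variable names hypothetical):
* <pre>{@code
* Category cat = entriesItem.getCat().copy();
* Category cat2 = argItem.getCat().copy();
* propagateTypes(cat);        // single category
* propagateTypes(cat, cat2);  // or both categories involved in a lookup
* }</pre>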
*/ public void propagateTypes(Category cat, Category cat2) { try { nomvarMap.clear(); cat.deepMap(nomvarTypePropagater); if (cat2 != null) cat2.deepMap(nomvarTypePropagater); cat.deepMap(nomvarTypePropagater); if (cat2 != null) cat2.deepMap(nomvarTypePropagater); } catch (TypePropagationException tpe) { if (debugSemClasses) { System.err.println( "Warning: unable to unify types '" + tpe.st1 + "' and '" + tpe.st2 + "' in cat: \n" + cat ); if (cat2 != null) System.err.println("and cat: \n" + cat2); } } } // a map from a cat's nomvars to types, // just using the var's name for equality @SuppressWarnings("unchecked") private Map nomvarMap = new THashMap( new TObjectHashingStrategy() { private static final long serialVersionUID = 1L; public int computeHashCode(Object o) { return ((NominalVar)o).getName().hashCode(); } public boolean equals(Object o1, Object o2) { return ((NominalVar)o1).getName().equals(((NominalVar)o2).getName()); } } ); // exception for unification failures in propagating types private class TypePropagationException extends RuntimeException { private static final long serialVersionUID = 1L; SimpleType st1; SimpleType st2; TypePropagationException(SimpleType st1, SimpleType st2) { this.st1 = st1; this.st2 = st2; } } // mod function to propagate nomvar types; // needs to be called twice after clearing nomvarMap private ModFcn nomvarTypePropagater = new ModFcn() { public void modify(Mutable m) { if (m instanceof NominalVar) { NominalVar nv = (NominalVar) m; SimpleType st = nv.getType(); SimpleType st0 = nomvarMap.get(nv); // add type to map if no type found if (st0 == null) { nomvarMap.put(nv, st); return; } // check equality if (st.equals(st0)) return; // otherwise unify types, update nv and map try { SimpleType stU = (SimpleType) st.unify(st0, null); nv.setType(stU); nomvarMap.put(nv, stU); } catch (UnifyFailure uf) { throw new TypePropagationException(st, st0); } } } }; // // distributive attribute propagation // /** * Returns the list of distributive attributes, or null if none. */ public String[] getDistributiveAttrs() { return _distributiveAttrs; } /** * Gathers and propagates the unique values of each * distributive attribute. */ public void propagateDistributiveAttrs(Category cat) { propagateDistributiveAttrs(cat, null); } /** * Gathers and propagates the unique values of each * distributive attribute. 
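* <p>A value is propagated only when exactly one distinct value of a
* distributive attribute occurs in the given category (or categories); it is
* then copied onto every atomic category where that attribute is unset. For
* instance, with a hypothetical distributive attribute {@code mood}, if
* {@code dcl} is the only mood value found, {@code mood=dcl} is filled in
* wherever mood is missing; if two different values occur, nothing is propagated.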
*/ public void propagateDistributiveAttrs(Category cat, Category cat2) { if (_distributiveAttrs == null) return; resetDistrAttrVals(); cat.forall(gatherDistrAttrVals); if (cat2 != null) { cat2.forall(gatherDistrAttrVals); } cat.forall(propagateUniqueDistrAttrVals); if (cat2 != null) { cat2.forall(propagateUniqueDistrAttrVals); } } // an array of lists, one for each distributive attr @SuppressWarnings("rawtypes") private List[] distrAttrVals = null; @SuppressWarnings("rawtypes") private void resetDistrAttrVals() { if (distrAttrVals == null) { distrAttrVals = new List[_distributiveAttrs.length]; for (int i = 0; i < distrAttrVals.length; i++) { distrAttrVals[i] = new ArrayList(3); } return; } for (int i = 0; i < distrAttrVals.length; i++) { distrAttrVals[i].clear(); } } // gathers distinct values for each distributive attr private CategoryFcn gatherDistrAttrVals = new CategoryFcnAdapter() { @SuppressWarnings("unchecked") public void forall(Category c) { if (!(c instanceof AtomCat)) return; FeatureStructure fs = c.getFeatureStructure(); if (fs == null) return; for (int i = 0; i < _distributiveAttrs.length; i++) { String attr = _distributiveAttrs[i]; Object val = fs.getValue(attr); if (val != null && !distrAttrVals[i].contains(val)) { distrAttrVals[i].add(val); } } } }; // propagates unique values for each distributive attr private CategoryFcn propagateUniqueDistrAttrVals = new CategoryFcnAdapter() { public void forall(Category c) { if (!(c instanceof AtomCat)) return; FeatureStructure fs = c.getFeatureStructure(); if (fs == null) return; for (int i = 0; i < _distributiveAttrs.length; i++) { if (distrAttrVals[i].size() != 1) continue; Object distVal = distrAttrVals[i].get(0); String attr = _distributiveAttrs[i]; Object val = fs.getValue(attr); if (val == null) { fs.setFeature(attr, UnifyControl.copy(distVal)); } } } }; // // licensing features // /** * Returns the list of licensing features. */ public LicensingFeature[] getLicensingFeatures() { return _licensingFeatures; } /** * Returns the index of the given relation in the relation sort order, * or the index of "*" if the relation is not explicitly listed. */ public Integer getRelationSortIndex(String rel) { Integer retval = _relationIndexMap.get(rel); if (retval != null) return retval; retval = _relationIndexMap.get("*"); if (retval != null) return retval; return new Integer(-1); } // // access to maps (limited) // /** Returns whether the given rel (semantic feature, really) is one used to signal coarticulation. */ public boolean isCoartRel(String rel) { return _coartRelsToPreds.containsKey(rel); } // // classes for caching lex lookups during realization // // a class for caching lookups of signs from rels // nb: equality is checked just on the rel, to check for a cached lookup private static class RelLookup { String rel; Collection signs; RelLookup(String s) { rel = s; } public int hashCode() { return rel.hashCode(); } public boolean equals(Object obj) { return (obj instanceof RelLookup) && rel.equals(((RelLookup)obj).rel); } } // a class for caching lookups of signs from preds and coart rels // nb: equality is checked just on the pred and coart rels, to check for a cached lookup private static class PredLookup { String pred; List coartRels; Collection signs; PredLookup(String s, List l) { pred = s; coartRels = l; } public int hashCode() { return pred.hashCode() + ((coartRels != null) ? 
coartRels.hashCode() : 0); } public boolean equals(Object obj) { if (!(obj instanceof PredLookup)) return false; PredLookup pLook = (PredLookup) obj; if (!pred.equals(pLook.pred)) return false; if (coartRels == null) return (pLook.coartRels == null); return coartRels.equals(pLook.coartRels); } } // // XML loading routines // private class MorphScanner extends XmlScanner { List morphItems = new ArrayList(); List macroItems = new ArrayList(); public void handleElement(Element e) { // create morph item if (e.getName().equals("entry")) { try { morphItems.add(new MorphItem(e)); } catch (RuntimeException exc) { System.err.println("Skipping morph item: " + e.getAttributeValue("word")); System.err.println(exc.toString()); } } // create macro item else if (e.getName().equals("macro")) { try { macroItems.add(new MacroItem(e)); } catch (RuntimeException exc) { System.err.println("Skipping macro item: " + e.getAttributeValue("name")); System.err.println(exc.toString()); } } } }; private Pair,List> getMorph(URL url) throws IOException { // scan XML MorphScanner morphScanner = new MorphScanner(); morphScanner.parse(url); // return morph and macro items return new Pair,List>(morphScanner.morphItems, morphScanner.macroItems); } private class LexiconScanner extends XmlScanner { List lexicon = new ArrayList(); Element distrElt = null; Element licensingElt = null; Element relationSortingElt = null; public void handleElement(Element e) { // create family if (e.getName().equals("family")) { try { lexicon.add(new Family(e)); } catch (RuntimeException exc) { System.err.println("Skipping family: " + e.getAttributeValue("name")); System.err.println(exc.toString()); } } // save distributive attributes else if (e.getName().equals("distributive-features")) distrElt = e; // save licensing features else if (e.getName().equals("licensing-features")) licensingElt = e; // save relation sort order else if (e.getName().equals("relation-sorting")) relationSortingElt = e; } }; private List getLexicon(URL url) throws IOException { // scan XML, creating families LexiconScanner lexiconScanner = new LexiconScanner(); lexiconScanner.parse(url); // get distributive attributes, if any if (lexiconScanner.distrElt != null) { String distrAttrs = lexiconScanner.distrElt.getAttributeValue("attrs"); _distributiveAttrs = distrAttrs.split("\\s+"); } // load licensing features loadLicensingFeatures(lexiconScanner.licensingElt); // load relation sort order loadRelationSortOrder(lexiconScanner.relationSortingElt); // return families return lexiconScanner.lexicon; } // get licensing features, with appropriate defaults @SuppressWarnings("unchecked") private void loadLicensingFeatures(Element licensingElt) { List licensingFeats = new ArrayList(); boolean containsLexFeat = false; if (licensingElt != null) { for (Iterator it = licensingElt.getChildren("feat").iterator(); it.hasNext(); ) { Element featElt = it.next(); String attr = featElt.getAttributeValue("attr"); if (attr.equals("lex")) containsLexFeat = true; String val = featElt.getAttributeValue("val"); List alsoLicensedBy = null; String alsoVals = featElt.getAttributeValue("also-licensed-by"); if (alsoVals != null) { alsoLicensedBy = Arrays.asList(alsoVals.split("\\s+")); } boolean licenseEmptyCats = true; boolean licenseMarkedCats = false; boolean instantiate = true; byte loc = LicensingFeature.BOTH; String lmc = featElt.getAttributeValue("license-marked-cats"); if (lmc != null) { licenseMarkedCats = Boolean.valueOf(lmc).booleanValue(); // change defaults licenseEmptyCats = false; loc = 
LicensingFeature.TARGET_ONLY; instantiate = false; } String lec = featElt.getAttributeValue("license-empty-cats"); if (lec != null) { licenseEmptyCats = Boolean.valueOf(lec).booleanValue(); } String inst = featElt.getAttributeValue("instantiate"); if (inst != null) { instantiate = Boolean.valueOf(inst).booleanValue(); } String locStr = featElt.getAttributeValue("location"); if (locStr != null) { if (locStr.equals("target-only")) loc = LicensingFeature.TARGET_ONLY; if (locStr.equals("args-only")) loc = LicensingFeature.ARGS_ONLY; if (locStr.equals("both")) loc = LicensingFeature.BOTH; } licensingFeats.add( new LicensingFeature( attr, val, alsoLicensedBy, licenseEmptyCats, licenseMarkedCats, instantiate, loc ) ); } } if (!containsLexFeat) { licensingFeats.add(LicensingFeature.defaultLexFeature); } _licensingFeatures = new LicensingFeature[licensingFeats.size()]; licensingFeats.toArray(_licensingFeatures); } // default relation sort order private static String[] defaultRelationSortOrder = { "BoundVar", "PairedWith", "Restr", "Body", "Scope", "*", "GenRel", "Coord", "Append" }; // get relation sort order, or use defaults private void loadRelationSortOrder(Element relationSortingElt) { // use defaults if no order specified if (relationSortingElt == null) { for (int i = 0; i < defaultRelationSortOrder.length; i++) { _relationIndexMap.put(defaultRelationSortOrder[i], new Integer(i)); } return; } // otherwise load from 'order' attribute String orderAttr = relationSortingElt.getAttributeValue("order"); String[] relSortOrder = orderAttr.split("\\s+"); for (int i = 0; i < relSortOrder.length; i++) { _relationIndexMap.put(relSortOrder[i], new Integer(i)); } } /* * Accessor for words map */ public GroupMap getWords() { return _words; } } ================================================ FILE: src/opennlp/ccg/lexicon/LicensingFeature.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-4 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; import java.util.*; /** * A licensing feature is one which controls the licensing and * instantiation of semantically null or marked categories * in the realizer. Defaults are handled in Lexicon.loadLicensingFeatures. * * @author Michael White * @version $Revision: 1.7 $, $Date: 2009/12/21 03:27:18 $ */ public class LicensingFeature { /** * The name of the licensing feature. */ public final String attr; /** * The string value of the licensing feature, or null if any value will do. */ public final String val; /** * A list of string values of other features that suffice to license * categories with this feature. 
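* <p>In the lexicon XML this corresponds to the {@code also-licensed-by}
* attribute (a whitespace-separated list) of a {@code feat} element under
* {@code licensing-features}; the feature names and values below are hypothetical:
* <pre>{@code
* <licensing-features>
*   <feat attr="inv" val="+" license-marked-cats="true" also-licensed-by="wh"/>
* </licensing-features>
* }</pre>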
*/ public final List alsoLicensedBy; /** * A flag indicating whether semantically null categories with the * licensing feature need to be licensed. */ public final boolean licenseEmptyCats; /** * A flag indicating whether initial categories with the * licensing feature are marked and need to be licensed. */ public final boolean licenseMarkedCats; /** * A flag indicating whether semantically empty categories with the * licensing feature should be instantiated. */ public final boolean instantiate; /** * The location of the licensing feature on the category to be licensed. * The value must be one of TARGET_ONLY, ARGS_ONLY or BOTH. */ public final byte loc; /** * Location of the feature on the target category only. */ public static final byte TARGET_ONLY = 1; /** * Location of the feature on the argument categories only. */ public static final byte ARGS_ONLY = 2; /** * Location of the feature on either the target category * or the argument categories. */ public static final byte BOTH = 0; /** Constructor. */ public LicensingFeature( String attr, String val, List alsoLicensedBy, boolean licenseEmptyCats, boolean licenseMarkedCats, boolean instantiate, byte loc ) { this.attr = attr; this.val = val; List emptyList = Collections.emptyList(); this.alsoLicensedBy = (alsoLicensedBy != null) ? alsoLicensedBy : emptyList; this.licenseEmptyCats = licenseEmptyCats; this.licenseMarkedCats = licenseMarkedCats; this.instantiate = instantiate; this.loc = loc; } /** Default lex feature. */ public static final LicensingFeature defaultLexFeature = new LicensingFeature("lex", null, null, true, false, true, BOTH); /** Simple lex feature, for comparison purposes. */ public static final LicensingFeature simpleLexFeature = new LicensingFeature("lex", null, null, true, false, false, BOTH); } ================================================ FILE: src/opennlp/ccg/lexicon/ListPairWord.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2010 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; import java.util.*; import opennlp.ccg.util.Pair; /** * A ListPairWord represents a word via a list of pairs of interned * attributes and values. It is intended to be a simple wrapper of * the list to make it act like a word, without requiring canonical * instances. * * @author Michael White * @version $Revision: 1.1 $, $Date: 2010/01/17 04:49:24 $ */ public class ListPairWord extends Word { private static final long serialVersionUID = 1L; /** * The list of pairs of attributes and values. */ protected List> pairsList; /** Constructor. */ public ListPairWord(List> pairsList) { this.pairsList = pairsList; } /** Returns the surface form. 
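* <p>Sketch of constructing a ListPairWord (lookup compares attribute names
* with {@code ==}, so the interned Tokenizer constants should be used):
* <pre>{@code
* List<Pair<String,String>> pairs = new ArrayList<Pair<String,String>>();
* pairs.add(new Pair<String,String>(Tokenizer.WORD_ATTR, "dogs"));
* pairs.add(new Pair<String,String>(Tokenizer.STEM_ATTR, "dog"));
* Word w = new ListPairWord(pairs);
* String form = w.getForm(); // "dogs"
* }</pre>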
*/ public String getForm() { return getValFromInterned(Tokenizer.WORD_ATTR); } /** Returns the pitch accent. */ public String getPitchAccent() { return getValFromInterned(Tokenizer.PITCH_ACCENT_ATTR); } /** Returns the list of extra attribute-value pairs. */ protected List> getAttrValPairsList() { List> retval = null; for (Pair pair : pairsList) { if (!isKnownAttr(pair.a)) { if (retval == null) retval = new ArrayList>(5); retval.add(pair); } } return retval; } /** Returns the stem. */ public String getStem() { return getValFromInterned(Tokenizer.STEM_ATTR); } /** Returns the part of speech. */ public String getPOS() { return getValFromInterned(Tokenizer.POS_ATTR); } /** Returns the supertag. */ public String getSupertag() { return getValFromInterned(Tokenizer.SUPERTAG_ATTR); } /** Returns the semantic class. */ public String getSemClass() { return getValFromInterned(Tokenizer.SEM_CLASS_ATTR); } /** Returns the value of the attribute with the given name, or null if none. The attribute names Tokenizer.WORD_ATTR, ..., Tokenizer.SEM_CLASS_ATTR may be used to retrieve the form, ..., semantic class. */ public String getVal(String attr) { String internedAttr = attr.intern(); // use == on interned attr return getValFromInterned(internedAttr); } /** Returns the value of the given interned attr, or null if none. */ protected String getValFromInterned(String attr) { for (Pair pair : pairsList) { if (pair.a == attr) return pair.b; } return null; } } ================================================ FILE: src/opennlp/ccg/lexicon/MacroAdder.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003 Jason Baldridge, Gann Bierner and // University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; import opennlp.ccg.synsem.*; import opennlp.ccg.util.*; import opennlp.ccg.unify.*; import opennlp.ccg.hylo.*; import java.util.*; /** * Adds the features from macros to a category. 
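* <p>Usage sketch, as in Lexicon.getWithEntriesItem (variable names hypothetical):
* <pre>{@code
* MacroAdder macAdder = getMacAdder(morphItem); // built from the morph item's macro names
* Category cat = entriesItem.getCat().copy();
* macAdder.addMacros(cat); // merge indexed feature structures, append LF macro preds
* }</pre>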
* * @author Jason Baldridge * @author Gann Bierner * @author Michael White * @version $Revision: 1.6 $, $Date: 2011/03/20 20:11:57 $ */ public class MacroAdder { private IntHashSetMap _specificMacros; private List _macroItems; // for LF macros public MacroAdder(IntHashSetMap sm, List macroItems) { _specificMacros = sm; _macroItems = macroItems; } public void addMacros(Category cat) { // add features cat.deepMap(addIndexedFeatures); // append preds to LF LF lf = cat.getLF(); for (int i=0; i < _macroItems.size(); i++) { MacroItem mi = _macroItems.get(i); LF[] preds = mi.getPreds(); for (int j=0; j < preds.length; j++) { LF pred = (LF) preds[j].copy(); if (!HyloHelper.isElementaryPredication(pred)) { System.out.println( "Warning: ignoring LF macro pred, which is not an elementary predication: " + pred ); continue; } lf = HyloHelper.append(lf, pred); } } // sort and reset LF HyloHelper.sort(lf); cat.setLF(lf); } private ModFcn addIndexedFeatures = new ModFcn() { @SuppressWarnings("rawtypes") public void modify(Mutable c) { if (c instanceof AtomCat) { FeatureStructure fs = ((AtomCat)c).getFeatureStructure(); int fsIndex = fs.getIndex(); Set featStrucs = (Set)_specificMacros.get(fsIndex); if (null == featStrucs) { return; } FeatureStructure $fs = fs.copy(); for (Iterator fsIt = featStrucs.iterator(); fsIt.hasNext();) { FeatureStructure macroFS = (FeatureStructure) fsIt.next(); $fs = $fs.inherit(macroFS); } ((AtomCat)c).setFeatureStructure($fs); } } }; } ================================================ FILE: src/opennlp/ccg/lexicon/MacroItem.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-4 Jason Baldridge, Gann Bierner and // University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; import opennlp.ccg.unify.*; import opennlp.ccg.synsem.*; import opennlp.ccg.hylo.HyloHelper; import org.jdom.*; import java.util.*; /** * Data structure for storing information about morphological macros. 
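* <p>A macro item is read from a {@code macro} element in the morph XML; a
* minimal sketch (the feature-structure attribute names here are assumptions):
* <pre>{@code
* <macro name="@pl">
*   <fs id="2" attr="num" val="pl"/>
* </macro>
* }</pre>
* The {@code name} (or {@code n}) attribute and the {@code fs} children are
* read directly by the constructor below; any preds under an {@code lf} child
* are appended to an entry's logical form when the macro is applied.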
* * @author Jason Baldridge * @author Gann Bierner * @author Michael White * @version $Revision: 1.5 $, $Date: 2009/12/21 03:27:18 $ */ public class MacroItem { private String name; private FeatureStructure[] featStrucs; private LF[] preds; public MacroItem() {}; @SuppressWarnings("unchecked") public MacroItem (Element e) { name = e.getAttributeValue("name"); if (name == null) { name = e.getAttributeValue("n"); } List<Element> fsEls = e.getChildren("fs"); featStrucs = new FeatureStructure[fsEls.size()]; for (int i=0; i < fsEls.size(); i++) { featStrucs[i] = new GFeatStruc(fsEls.get(i)); } Element lfElt = e.getChild("lf"); if (lfElt != null) { List<Element> predElts = lfElt.getChildren(); preds = new LF[predElts.size()]; for (int i=0; i < predElts.size(); i++) { preds[i] = HyloHelper.getLF(predElts.get(i)); } } } public void setName(String s) { name=s; } //public void setSpecs(ArrayList al) {specs = al; } public String getName() { return name; } public FeatureStructure[] getFeatureStructures() { return featStrucs; } public LF[] getPreds() { return preds; } //public void addSpec(String s) { specs.add(s); } //public void removeSpec(String s) { // specs.remove(specs.indexOf(s)); //} } ================================================ FILE: src/opennlp/ccg/lexicon/MorphItem.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-5 Jason Baldridge, Gann Bierner and // University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; import org.jdom.*; import opennlp.ccg.grammar.Grammar; /** * A data structure for morphological entries. * * @author Jason Baldridge * @author Gann Bierner * @author Michael White * @version $Revision: 1.11 $, $Date: 2009/10/17 20:46:20 $ */ public class MorphItem { private static final String[] emptyStringArray = new String[0]; private Word surfaceWord; private Word word; private Word coartIndexingWord = null; private String[] macros = emptyStringArray; private String[] excluded = emptyStringArray; private boolean coart = false; /** Constructor. */ public MorphItem() {}; /** Constructor from XML element.
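* <p>The recognized attributes are {@code word}, {@code stem}, {@code pos},
* {@code class}, {@code macros}, {@code excluded} and {@code coart};
* for example (values hypothetical):
* <pre>{@code
* <entry word="dogs" stem="dog" pos="NN" class="animal" macros="@pl"/>
* }</pre>
* If no stem is given, the surface form is used; the supertag is filled in
* later from the syntactic category.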
*/ public MorphItem(Element e) { String coartString = e.getAttributeValue("coart"); if ("true".equals(coartString)) coart = true; String wordString = e.getAttributeValue("word"); boolean strictFactors = coart; // parse with flag for strict factors with coart items Word tokenizedWord = Grammar.theGrammar.lexicon.tokenizer.parseToken(wordString, strictFactors); surfaceWord = Word.createSurfaceWord(tokenizedWord); String stem = e.getAttributeValue("stem"); if (stem == null) stem = surfaceWord.getForm(); String POS = e.getAttributeValue("pos"); String supertag = null; // supertag comes later from syn cat String semClass = e.getAttributeValue("class"); word = Word.createFullWord(surfaceWord, stem, POS, supertag, semClass); String macrosString = e.getAttributeValue("macros"); if (macrosString != null) { macros = macrosString.split("\\s+"); } String excludedString = e.getAttributeValue("excluded"); if (excludedString != null) { excluded = excludedString.split("\\s+"); } // index on first attr of coarts if (coart) { String indexAttr = wordString.substring(0, wordString.indexOf("-")); String indexVal = surfaceWord.getVal(indexAttr); coartIndexingWord = Word.createWord(indexAttr, indexVal); } } /** Returns whether the name, qualified name or family name of the given entries item is in the excluded list. */ public boolean excluded(EntriesItem eItem) { if (excluded.length == 0) return false; for (int i = 0; i < excluded.length; i++) { if (eItem.getName().equals(excluded[i])) return true; if (eItem.getQualifiedName().equals(excluded[i])) return true; if (eItem.getFamilyName().equals(excluded[i])) return true; } return false; } /** Returns the full word. */ public Word getWord() { return word; } /** Returns the surface word (without the stem, POS and semantic class). */ public Word getSurfaceWord() { return surfaceWord; } /** Returns the macro names. */ public String[] getMacros() { return macros; } /** Returns the names of the excluded entries. */ public String[] getExcluded() { return excluded; } /** Returns whether the morph item is a coarticulation, eg a pitch accent. */ public boolean isCoart() { return coart; } /** Returns the word for indexing this coarticulation (or null if not a coarticulation). */ public Word getCoartIndexingWord() { return coartIndexingWord; } /** Returns a string for this morph item. */ // nb: excluded not handled public String toString() { StringBuffer sb = new StringBuffer(); sb.append('['); for (int i=0; i < macros.length; i++) { sb.append(macros[i]); if (i < macros.length-1) sb.append(','); } sb.append(']'); return "{" + word + " => " + sb + "}"; } } ================================================ FILE: src/opennlp/ccg/lexicon/SimpleWord.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. 
// // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; import opennlp.ccg.util.*; import java.util.*; /** * A SimpleWord object is a surface word which stores just the word form. * SimpleWord serves as the base class for concrete instantiations of words. * * @author Michael White * @version $Revision: 1.4 $, $Date: 2009/07/17 04:23:30 $ */ public class SimpleWord extends Word { private static final long serialVersionUID = 181491057498517717L; /** The surface form. */ protected String form; /** Returns the surface form. */ public String getForm() { return form; } /** Returns the pitch accent. */ public String getPitchAccent() { return null; } /** Returns the list of extra attribute-value pairs. */ protected List> getAttrValPairsList() { return null; } /** Returns the stem. */ public String getStem() { return null; } /** Returns the part of speech. */ public String getPOS() { return null; } /** Returns the supertag. */ public String getSupertag() { return null; } /** Returns the semantic class. */ public String getSemClass() { return null; } /** Returns the value of the attribute with the given name, or null if none. The attribute names Tokenizer.WORD_ATTR, ..., Tokenizer.SEM_CLASS_ATTR may be used to retrieve the form, ..., semantic class. */ public String getVal(String attr) { String internedAttr = attr.intern(); // use == on interned attr if (internedAttr == Tokenizer.WORD_ATTR) return getForm(); if (internedAttr == Tokenizer.PITCH_ACCENT_ATTR) return getPitchAccent(); if (internedAttr == Tokenizer.STEM_ATTR) return getStem(); if (internedAttr == Tokenizer.POS_ATTR) return getPOS(); if (internedAttr == Tokenizer.SUPERTAG_ATTR) return getSupertag(); if (internedAttr == Tokenizer.SEM_CLASS_ATTR) return getSemClass(); List> pairs = getAttrValPairsList(); if (pairs == null) return null; for (int i = 0; i < pairs.size(); i++) { Pair p = pairs.get(i); if (p.a == internedAttr) return p.b; } return null; // not found } /** Constructor. */ protected SimpleWord(String form) { this.form = form; } } ================================================ FILE: src/opennlp/ccg/lexicon/SupertaggerAdapter.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2008-9 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; import java.util.*; /** * The SupertaggerAdapter interface is for plugging a supertagger into the * lexicon in order to return only the desired, high probability categories * during lexical lookup. Once the supertagger has been plugged in, * using Lexicon.setSupertagger, the supertagger will be consulted during * each lexical lookup for the desired categories, using getSupertags. * Note that this entails that the supertagger must update its state between lexical * lookup calls; in this way, identical words in a sentence can have different * predicted categories. * * The supertagger returns beta-best categories for lexical lookup * according to a sequence of beta settings it maintains internally. * Associated probabilities for each supertag are also returned. * The 'include gold' option controls whether gold standard tags are included * during training. * * At present, the lexicon must contain appropriate morph items for all words. * However, the supertags assigned to a word need not be limited to those explicitly * listed in the lexicon. When there is an explicit entry, it will be used, * as doing so allows the specification of a 'pred' which differs from the stem, * as well as macros that can affect the supertag. Otherwise, when using a supertagger, * it is no longer necessary to list stems with categories in the lexicon, as the * supertagger becomes responsible for this mapping. * * Note also that at present, only one supertagger (for either parsing or realization) * may be plugged in to the lexicon at a time. * * @author Michael White * @version $Revision: 1.11 $, $Date: 2010/12/08 15:24:26 $ */ public interface SupertaggerAdapter { /** * Class for caching a lexical item's log prob in a sign. */ public static class LexLogProb { /** The log prob. */ public final float logprob; /** Constructor. */ public LexLogProb(float logprob) { this.logprob = logprob; } } /** * Returns the supertags of the desired categories for the current lexical lookup * as a map from supertags to contextual probabilities (or null to accept all). */ public Map getSupertags(); /** * Sets the flag for whether to include gold tags. */ public void setIncludeGold(boolean includeGold); /** * Resets beta to the most restrictive value. */ public void resetBeta(); /** * Resets beta to the least restrictive value. */ public void resetBetaToMax(); /** * Advances beta to the next most restrictive setting. */ public void nextBeta(); /** * Advances beta to the next less restrictive setting. */ public void previousBeta(); /** * Returns whether there are any less restrictive beta settings * remaining in the sequence. */ public boolean hasMoreBetas(); /** * Returns whether there are any more restrictive beta settings * remaining in the sequence. */ public boolean hasLessBetas(); /** Returns all the beta values. */ public double[] getBetas(); /** Sets the beta values. */ public void setBetas(double[] betas); /** Returns the current beta value. 
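* <p>Sketch of how a client typically steps through the beta settings
* (variable names hypothetical):
* <pre>{@code
* stagger.resetBeta();                        // start with the most restrictive setting
* while (true) {
*     // ... attempt lexical lookup / parsing with the current supertags ...
*     if (success || !stagger.hasMoreBetas()) break;
*     stagger.nextBeta();                     // back off to the next beta setting
* }
* double beta = stagger.getCurrentBetaValue();
* }</pre>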
*/ public double getCurrentBetaValue(); } ================================================ FILE: src/opennlp/ccg/lexicon/Tokenizer.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004-5 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; import java.util.*; /** * The Tokenizer interface provides a way to customize tokenization * and handling of special tokens. * A custom tokenizer may be specified in the grammar file. * DefaultTokenizer provides a default implementation, which can also * be subclassed for custom behavior. * * @author Michael White * @version $Revision: 1.14 $, $Date: 2005/10/20 17:30:30 $ **/ public interface Tokenizer { /** Name used to tokenize word form attribute (usually left implicit). */ public static final String WORD_ATTR = "W"; /** Name used to tokenize stem attribute. */ public static final String STEM_ATTR = "S"; /** Name used to tokenize part-of-speech attribute. */ public static final String POS_ATTR = "P"; /** Name used to tokenize supertag attribute. */ public static final String SUPERTAG_ATTR = "T"; /** Name used to tokenize semantic class attribute. */ public static final String SEM_CLASS_ATTR = "C"; /** Name used to tokenize pitch accent attribute. */ public static final String PITCH_ACCENT_ATTR = "A"; /** Constant used to signal the substitution of a date as the pred. */ public static final String DATE_VAL = "[*DATE*]"; /** Constant used to represent the semantic class date. */ public static final String DATE_CLASS = "date"; /** Constant used to signal the substitution of a time as the pred. */ public static final String TIME_VAL = "[*TIME*]"; /** Constant used to represent the semantic class time. */ public static final String TIME_CLASS = "time"; /** Constant used to signal the substitution of a number as the pred. */ public static final String NUM_VAL = "[*NUM*]"; /** Constant used to represent the semantic class number. */ public static final String NUM_CLASS = "num"; /** Constant used to signal the substitution of an amount as the pred. */ public static final String AMT_VAL = "[*AMT*]"; /** Constant used to represent the semantic class amount. */ public static final String AMT_CLASS = "amt"; /** Constant used to signal the substitution of a duration as the pred. */ public static final String DUR_VAL = "[*DUR*]"; /** Constant used to represent the semantic class duration. */ public static final String DUR_CLASS = "dur"; /** * Constant used to signal the substitution of a named entity * (not listed in lexicon) as the pred. 
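* <p>Sketch of the special-token round trip used during lexical lookup
* (a hypothetical {@code tokenizer} instance; whether a given string is
* recognized depends on the implementation):
* <pre>{@code
* String cls = tokenizer.isSpecialToken("1/2/2004");        // e.g. Tokenizer.DATE_CLASS, or null
* String constant = tokenizer.getSpecialTokenConstant(cls); // e.g. Tokenizer.DATE_VAL, or null
* }</pre>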
*/ public static final String NE_VAL = "[*NE*]"; /** Constant used to represent the semantic class (other) named entity. */ public static final String NE_CLASS = "ne"; /** * Parses an input string into a list of words, * including any explicitly given factors, * and the semantic class of special tokens. * Tokens are parsed into words using parseToken. */ public List tokenize(String s); /** * Parses an input string into a list of words, * including any explicitly given factors, * and the semantic class of special tokens. * Tokens are parsed into words using parseToken, according to the given * flag for whether to parse factors strictly. */ public List tokenize(String s, boolean strictFactors); /** * Parses a token into a word, including any explicitly given factors * and the semantic class of special tokens. */ public Word parseToken(String token); /** * Parses a token into a word, including any explicitly given factors * and the semantic class of special tokens, according to the given * flag for whether to parse factors strictly. */ public Word parseToken(String token, boolean strictFactors); /** * Returns a string (eg Tokenizer.DATE_CLASS) indicating the semantic class * of special token, if the given token is recognized as a special * token; otherwise returns null. */ public String isSpecialToken(String token); /** * Returns the special token constant for the given special token class, * or null if none. */ public String getSpecialTokenConstant(String semClass); /** * Returns true iff the given string is a special token constant * (eg Tokenizer.DATE_VAL). */ public boolean isSpecialTokenConstant(String s); /** Returns true iff the token is recognized as a date. */ public boolean isDate(String token); /** Returns true iff the token is recognized as a time. */ public boolean isTime(String token); /** Returns true iff the token is recognized as a number. */ public boolean isNum(String token); /** Returns true iff the token is recognized as an amount. */ public boolean isAmt(String token); /** * Returns true iff the token is recognized as a named entity (not listed in lexicon). */ public boolean isNamedEntity(String token); /** * Adds a semantic class to replace words with for language models. */ public void addReplacementSemClass(String semClass); /** * Returns whether the given semantic class is one to replace words with for language models. * The sem class is assumed to have been interned. */ public boolean isReplacementSemClass(String semClass); /** * Returns a string for the given list of words. */ public String getOrthography(List words); /** * Returns a string for the given list of words, optionally with semantic class replacement. */ public String getOrthography(List words, boolean semClassReplacement); /** * Returns a string for the given word, optionally with semantic class replacement. */ public String getOrthography(Word w, boolean semClassReplacement); /** * Returns a string for the given list of words, * in the format expected by the SRILM tool for factored language models. */ public String format(List words); /** * Returns a string for the given word, * in the format expected by the SRILM tool for factored language models. */ public String format(Word word); /** * Returns a string for the given list of words, * in the format expected by the SRILM tool for factored language models, * optionally with semantic class replacement. 
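* <p>Sketch with a hypothetical {@code tokenizer} instance (the exact factored
* output depends on the implementation):
* <pre>{@code
* List words = tokenizer.tokenize("he walks");
* String flmLine = tokenizer.format(words, true); // with sem class replacement
* }</pre>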
*/ public String format(List words, boolean semClassReplacement); /** * Returns a string for the given word, * in the format expected by the SRILM tool for factored language models, * optionally with semantic class replacement. */ public String format(Word word, boolean semClassReplacement); /** * Returns one or more orthographic words for the given word. * This method is called from within Sign.getWordsInXml as * part of producing the textual output of realization. */ public List expandWord(Word word); /** * Returns one or more orthographic words for the given date token. */ public List expandDate(String date); /** * Returns one or more orthographic words for the given time token. */ public List expandTime(String time); /** * Returns one or more orthographic words for the given number token. */ public List expandNum(String num); /** * Returns one or more orthographic words for the given amount token. */ public List expandAmt(String amt); /** * Returns one or more orthographic words for the given named entity token. */ public List expandNamedEntity(String namedEntity); } ================================================ FILE: src/opennlp/ccg/lexicon/TrueCaser.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2011 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; /** * A simple class that is constructed with a file containing a list of words * that are all and only those found (presumably from a large corpus) to be * more frequently upper-cased. Any word-string passed to it (that is also * not a named entity string) is queried in this list. If the word is there * it is restored to the casing found in the list, if it is not, it is converted * to lower-case. * * There is an option, skipAlreadyLower, to skip any word that is already in lower case, * so as to avoid mistakenly uppercasing words. This option is enabled by default. * * @author Dennis N. Mehay * */ import java.util.*; import java.io.*; import java.nio.charset.Charset; import opennlp.ccg.lexicon.Word; import opennlp.ccg.lexicon.DefaultTokenizer; import java.util.zip.GZIPInputStream; public class TrueCaser { /** Flag for skipping words already in lower case (enabled by default). */ public boolean skipAlreadyLower = true; /** * A map from lower-cased keys to the true-cased forms (from the list passed in during construction). */ private Map caseMap = new HashMap(); /** * For the heuristics that determine whether something is in title case: what percentage of the sentence must be * cased to make the title-case detector go off? 
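 *
 * <p>Illustrative usage sketch, with a hypothetical path to a gzipped list of
 * true-cased words and an explicit title-case threshold:
 * <pre>{@code
 * TrueCaser tc = new TrueCaser("models/truecase-words.txt.gz", 0.5);
 * String restored = tc.trueCaseSentence("The Treaty Was Signed In London .");
 * }</pre>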
*/ private double titleCaseThreshold; /** * Constructor that just takes a path to a list of words that are only upper-case (title-case is default = 0.9). */ public TrueCaser(String pathToOnlyUCWords) { this(pathToOnlyUCWords, 0.5); } /** * Constructor that takes a path to a list of words that are only upper-case and a title-case threshold. */ public TrueCaser(String pathToOnlyUCWords, double titleCaseThreshold) { this.titleCaseThreshold = titleCaseThreshold; this.caseMap = TrueCaser.readInCaseMap(pathToOnlyUCWords); if (this.caseMap == null) { System.err.println("Something went wrong."+System.getProperty("line.separator")+ "Make sure you passed in a file of true-cased words, etc."); System.exit(-1); } else { //System.err.println("Reading in list of true-cased words: "+pathToOnlyUCWords+System.getProperty("line.separator")+ // " at a title-case heursitic detection threshold of: "+titleCaseThreshold); } } /** * Static method to read in the list of words. */ public static Map readInCaseMap(String pathToOnlyUCWords) { Map caseMap = new HashMap(); BufferedReader inRead = null; try { Charset utf8 = Charset.availableCharsets().get("UTF-8"); inRead = new BufferedReader( (pathToOnlyUCWords.toLowerCase().endsWith(".gz")) ? (new InputStreamReader(new GZIPInputStream(new FileInputStream(new File(pathToOnlyUCWords))), utf8)) : (new InputStreamReader(new FileInputStream(new File(pathToOnlyUCWords)), utf8)) ); String ln = inRead.readLine(); while(ln != null) { ln = ln.trim(); if(!ln.startsWith("#")) { caseMap.put(ln.toLowerCase(), ln); } ln = inRead.readLine(); } } catch (IOException ioe) { return null; } finally { try { inRead.close(); } catch (Exception e) { // do nothing. } } return caseMap; } /** * Truecase a candidate word. If the word is in the list of more commonly * cased words, then return this cased form. If not, normalize to lowercase if * this is the first word or the sentence is in titlecase. Else return the word as-is. * If skipAlreadyLower is enabled, skip the word if it is already in lower case. */ public String trueCase(String theWord, boolean isTitle, boolean isFirstWord) { String loweredWord = theWord.toLowerCase(); // skip word in lower case per flag if (skipAlreadyLower && theWord.equals(loweredWord)) return theWord; // look up the truecased version; if not there, and title-case or first // word in sentence, lowercase it, otherwise, don't touch it. String trueCasedTheWord = caseMap.get(loweredWord); if (trueCasedTheWord != null) { return trueCasedTheWord; } else { return (isTitle || isFirstWord) ? loweredWord : theWord; } } /** * Truecase a whole sentence. If the sentence appears to be in title-case (as determined by a heuristic * that is triggered by there being greater than 0.X of the first 10 words, if there are that many, * being cased) normalize any word that is not in the true-case list to lower-case. Otherwise, leave all * words that are not in the true-case list alone, except the first word (which is normalized to lower-case) * The title-case threshold is a creation-time parameter. * As always, if skipAlreadyLower is enabled, the word is skipped if it is already in lower case. Note that * the second word is counted as the first word if the first token is a left quote (single or double). */ public String trueCaseSentence(String sentence) { String[] parts = sentence.split("\\s+"); StringBuffer res = new StringBuffer(parts.length); boolean isTitle = isTitleCased(parts); // truecase the whole sentence (only normalizing by lowercasing if // titlecase detector went off). 
int i = 0; for (String prt : parts) { boolean isFirstWord = (i == 0 || (i == 1 && (parts[0].equals("``") || parts[0].equals("`")))); res.append(" " + trueCase(prt, isTitle, isFirstWord)); i++; } return res.toString().trim(); } /** * Returns true iff the percentage of the first 10 words (or the whole sentence if it's less than 10 words) * that have a case distinction is greater than or equal to 'titleCaseThreshold'. */ public boolean isTitleCased(String[] words) { int numCased = 0, cursor = 0; for (String wd : words) { if (cursor >= 10) { break; } if (!wd.toLowerCase().equals(wd)) { numCased++; } cursor++; } return (numCased / ((words.length < 10) ? (words.length + 0.0) : 10.0) >= titleCaseThreshold); } public String tcWordToString(String newWordForm, Word oldWord) { StringBuffer sb = new StringBuffer(); sb.append(newWordForm); if (oldWord.getPOS() != null) sb.append(":P-").append(DefaultTokenizer.escape(oldWord.getPOS())); if (oldWord.getSupertag() != null) sb.append(":T-").append(DefaultTokenizer.escape(oldWord.getSupertag())); if (oldWord.getSemClass() != null) sb.append(":C-").append(DefaultTokenizer.escape(oldWord.getSemClass())); if (sb.length() == 0) sb.append((String) null); return sb.toString(); } public static void main(String[] args) throws IOException { String newline = System.getProperty("line.separator"); String usage = newline + "java TrueCaser -t -r -i -o " + newline; if(args.length == 0 || args[0] .equals("h") || args[0] .equals("-h") || args[0] .equals("--h") || args[0] .equals("--help") || args[0] .equals("-help")) { System.err.println(usage); System.exit(0); } String truecasefile = null, inputfile = null, outputfile = null; double tcThresh = 0.5; for (int a = 0; a < args.length; a++) { if (args[a].equals("-t")) { truecasefile = args[++a]; continue; } if (args[a].equals("-r")) { tcThresh = Double.parseDouble(args[++a]); continue; } if (args[a].equals("-i")) { inputfile = args[++a]; continue; } if (args[a].equals("-o")) { outputfile = args[++a]; continue; } System.err.println("unrecognized option " + args[a] + "."); System.err.println(usage); System.exit(0); } Charset utf8 = Charset.availableCharsets().get("UTF-8"); // input of text (assumed to be tokenized utf-8-encoded text). BufferedReader in = new BufferedReader(new InputStreamReader( ((inputfile == null) ? System.in : (new FileInputStream( new File(inputfile)))), utf8)); // output stream (back to tokenized utf-8-encoded text). BufferedWriter out = new BufferedWriter(new OutputStreamWriter( ((outputfile == null) ? System.out : (new FileOutputStream( new File(outputfile)))), utf8)); // file of true-cased words is arg0. TrueCaser tc = new TrueCaser(truecasefile, tcThresh); String sent = in.readLine(); while (sent != null) { sent = tc.trueCaseSentence(sent.trim()); out.write(sent + System.getProperty("line.separator")); sent = in.readLine(); } out.close(); in.close(); } } ================================================ FILE: src/opennlp/ccg/lexicon/Word.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004-5 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. 
// // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; import opennlp.ccg.util.*; import java.io.*; import java.util.*; import gnu.trove.*; /** * A Word object may either be a surface word or a full word. * A surface word holds a surface form, an optional pitch accent, and an * optional list of extra attribute-value pairs. * A full word additionally contains a stem, part of speech, supertag and semantic class. * A word may be a multiword consisting of multiple orthographic words, * typically separated by underscores in the surface form. * For efficient storage and equality checking, Word objects are interned by * the factory methods of the configured WordFactory. * * @author Michael White * @version $Revision: 1.21 $, $Date: 2009/12/16 22:39:20 $ */ abstract public class Word implements Serializable, Comparable { private static final long serialVersionUID = 1L; /** Returns the surface form. */ abstract public String getForm(); /** Returns the pitch accent. */ abstract public String getPitchAccent(); // empty iterator private static Iterator> emptyIterator = new ArrayList>(0).iterator(); /** Returns an iterator over the extra attribute-value pairs. */ public Iterator> getAttrValPairs() { List> pairs = getAttrValPairsList(); return (pairs != null) ? pairs.iterator() : emptyIterator; } /** Returns an iterator over the surface attribute-value pairs, including the pitch accent (if any). */ public Iterator> getSurfaceAttrValPairs() { List> pairs = getAttrValPairsList(); String pitchAccent = getPitchAccent(); if (pairs == null && pitchAccent == null) return emptyIterator; else if (pairs == null) { List> retval = new ArrayList>(1); retval.add(new Pair(Tokenizer.PITCH_ACCENT_ATTR, pitchAccent)); return retval.iterator(); } else if (pitchAccent == null) return pairs.iterator(); else { List> retval = new ArrayList>(pairs); retval.add(new Pair(Tokenizer.PITCH_ACCENT_ATTR, pitchAccent)); return retval.iterator(); } } /** Returns the list of extra attribute-value pairs. */ abstract protected List> getAttrValPairsList(); /** Returns the stem. */ abstract public String getStem(); /** Returns the part of speech. */ abstract public String getPOS(); /** Returns the supertag. */ abstract public String getSupertag(); /** Returns the semantic class. */ abstract public String getSemClass(); /** Returns the value of the attribute with the given name, or null if none. The attribute names Tokenizer.WORD_ATTR, ..., Tokenizer.SEM_CLASS_ATTR may be used to retrieve the form, ..., semantic class. 
*/ abstract public String getVal(String attr); // the known attr names private static Set knownAttrs = initKnownAttrs(); @SuppressWarnings("unchecked") private static Set initKnownAttrs() { Set knownAttrs = new THashSet(new TObjectIdentityHashingStrategy()); String[] names = { Tokenizer.WORD_ATTR, Tokenizer.PITCH_ACCENT_ATTR, Tokenizer.STEM_ATTR, Tokenizer.POS_ATTR, Tokenizer.SUPERTAG_ATTR, Tokenizer.SEM_CLASS_ATTR }; for (int i = 0; i < names.length; i++) { knownAttrs.add(names[i]); } return knownAttrs; } /** Returns whether the given attr is a known one (vs an extra one). */ public static boolean isKnownAttr(String attr) { return knownAttrs.contains(attr.intern()); } /** Returns true if the form is non-null, while the stem, part of speech, supertag and semantic class are null. */ public boolean isSurfaceWord() { return getForm() != null && getStem() == null && getPOS() == null && getSupertag() == null && getSemClass() == null; } // factory methods /** Factory interface. */ public interface WordFactory { /** Creates a surface word with the given interned form. */ public Word create(String form); /** Creates a (surface or full) word with the given normalized attribute name and value. The attribute names Tokenizer.WORD_ATTR, ..., Tokenizer.SEM_CLASS_ATTR may be used for the form, ..., semantic class. */ public Word create(String attr, String val); /** Creates a (surface or full) word from the given canonical factors. */ public Word create( String form, String pitchAccent, List> attrValPairs, String stem, String POS, String supertag, String semClass ); } /** The word factory to use. */ protected static WordFactory wordFactory = new FullWord.Factory(); // NB: could try different factory methods for concrete words, but // it's unclear whether it makes much difference // protected static WordFactory wordFactory = new FactorChainWord.Factory(); /** Creates a surface word with the given form. */ public static synchronized Word createWord(String form) { form = (form != null) ? form.intern() : null; return wordFactory.create(form); } /** Creates a (surface or full) word. */ public static synchronized Word createWord( String form, String pitchAccent, List> attrValPairs, String stem, String POS, String supertag, String semClass ) { // normalize factors form = (form != null) ? form.intern() : null; pitchAccent = (pitchAccent != null) ? pitchAccent.intern() : null; if (attrValPairs != null) { if (attrValPairs.isEmpty()) attrValPairs = null; else { attrValPairs = new ArrayList>(attrValPairs); sortAttrValPairs(attrValPairs); for (int i = 0; i < attrValPairs.size(); i++) { Pair p = attrValPairs.get(i); String attr = p.a.intern(); String val = (p.b != null) ? p.b.intern() : null; attrValPairs.set(i, new Pair(attr, val)); } } } stem = (stem != null) ? stem.intern() : null; POS = (POS != null) ? POS.intern() : null; supertag = (supertag != null) ? supertag.intern() : null; semClass = (semClass != null) ? semClass.intern() : null; // create word return createWordDirectly(form, pitchAccent, attrValPairs, stem, POS, supertag, semClass); } // comparator for attr-val pairs private static Comparator> attrValComparator = new Comparator>() { public int compare(Pair p1, Pair p2) { return p1.a.compareTo(p2.a); } }; /** Sorts attr-val pairs by attr name. */ private static void sortAttrValPairs(List> pairs) { Collections.sort(pairs, attrValComparator); } /** Creates a (surface or full) word directly, from the given canonical factors. 
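 *
 * <p>Illustrative usage sketch for the public factory methods, mirroring the
 * serialization test in {@code main} below:
 * <pre>{@code
 * Word surface = Word.createWord("ran");
 * Word full = Word.createFullWord(surface, "run", "VBD", "s\\np", "MOTION");
 * // factories intern words, so re-creation with the same factors is expected
 * // to yield the identical object
 * boolean sameObject = (full == Word.createFullWord(surface, "run", "VBD", "s\\np", "MOTION"));
 * }</pre>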
*/ private static synchronized Word createWordDirectly( String form, String pitchAccent, List> attrValPairs, String stem, String POS, String supertag, String semClass ) { return wordFactory.create(form, pitchAccent, attrValPairs, stem, POS, supertag, semClass); } /** Creates a (surface or full) word with the given attribute name and value. The attribute names Tokenizer.WORD_ATTR, ..., Tokenizer.SEM_CLASS_ATTR may be used for the form, ..., semantic class. */ public static synchronized Word createWord(String attr, String val) { attr = attr.intern(); val = (val != null) ? val.intern() : null; return wordFactory.create(attr, val); } /** Creates a (surface or full) word from the given one, replacing the word form with the given one. */ public static synchronized Word createWord(Word word, String form) { if (form != null) form = form.intern(); return createWordDirectly( form, word.getPitchAccent(), word.getAttrValPairsList(), word.getStem(), word.getPOS(), word.getSupertag(), word.getSemClass() ); } /** Creates a (surface or full) word from the given one, replacing the form and stem with the semantic class, uppercased. */ public static synchronized Word createWordUsingSemClass(Word word) { String form = word.getSemClass().toUpperCase().intern(); String stem = form; return createWordDirectly( form, word.getPitchAccent(), word.getAttrValPairsList(), stem, word.getPOS(), word.getSupertag(), word.getSemClass() ); } /** Creates a (surface or full) word from the given surface one, adding the second word's additional attr-val pairs. */ public static synchronized Word createWordWithAttrs(Word word, Word word2) { // get accent String accent = word.getPitchAccent(); if (accent == null) accent = word2.getPitchAccent(); // get attrs boolean mixedAttrs = false; List> pairs = word.getAttrValPairsList(); List> pairs2 = word2.getAttrValPairsList(); if (pairs == null && pairs2 != null) { pairs = pairs2; } else if (pairs2 != null) { mixedAttrs = true; pairs = new ArrayList>(pairs); for (int i = 0; i < pairs2.size(); i++) { if (!pairs.contains(pairs2.get(i))) { pairs.add(pairs2.get(i)); } } } // get rest String form = word.getForm(); String stem = word.getStem(); String POS = word.getPOS(); String supertag = word.getSupertag(); String semClass = word.getSemClass(); // with mixed attrs, need to normalize if (mixedAttrs) return createWord(form, accent, pairs, stem, POS, supertag, semClass); else return createWordDirectly(form, accent, pairs, stem, POS, supertag, semClass); } /** Creates a full word from the given surface one, adding the given stem, POS and semantic class. */ public static synchronized Word createFullWord(Word word, String stem, String POS, String supertag, String semClass) { stem = (stem != null) ? stem.intern() : null; POS = (POS != null) ? POS.intern() : null; supertag = (supertag != null) ? supertag.intern() : null; semClass = (semClass != null) ? semClass.intern() : null; return createWordDirectly(word.getForm(), word.getPitchAccent(), word.getAttrValPairsList(), stem, POS, supertag, semClass); } /** Creates a full word from the given surface one, adding the second (full) given word's stem, POS and semantic class, as well as the second word's additional attr-val pairs, plus the given supertag. 
*/ public static synchronized Word createFullWord(Word word, Word word2, String supertag) { boolean mixedAttrs = false; List> pairs = word.getAttrValPairsList(); List> pairs2 = word2.getAttrValPairsList(); if (pairs == null && pairs2 != null) { pairs = pairs2; } else if (pairs2 != null) { mixedAttrs = true; pairs = new ArrayList>(pairs); for (int i = 0; i < pairs2.size(); i++) { if (!pairs.contains(pairs2.get(i))) { pairs.add(pairs2.get(i)); } } } if (mixedAttrs) { return createWord( word.getForm(), word.getPitchAccent(), pairs, word2.getStem(), word2.getPOS(), supertag, word2.getSemClass() ); } else { supertag = (supertag != null) ? supertag.intern() : null; return createWordDirectly( word.getForm(), word.getPitchAccent(), pairs, word2.getStem(), word2.getPOS(), supertag, word2.getSemClass() ); } } /** Creates a surface word from the given one, removing the stem, POS, supertag and semantic class. */ public static synchronized Word createSurfaceWord(Word word) { return createWordDirectly(word.getForm(), word.getPitchAccent(), word.getAttrValPairsList(), null, null, null, null); } /** Creates a surface word from the given one, removing the stem, POS, supertag and semantic class, and replacing the form with the given one. */ public static synchronized Word createSurfaceWord(Word word, String form) { form = (form != null) ? form.intern() : null; return createWordDirectly(form, word.getPitchAccent(), word.getAttrValPairsList(), null, null, null, null); } /** Creates a surface word from the given one, removing the stem, POS, supertag and semantic class, and replacing the form with the semantic class, uppercased. */ public static synchronized Word createSurfaceWordUsingSemClass(Word word) { String form = word.getSemClass().toUpperCase().intern(); return createWordDirectly(form, word.getPitchAccent(), word.getAttrValPairsList(), null, null, null, null); } /** Creates a core surface word from the given one, removing all attrs in the given set. */ public static synchronized Word createCoreSurfaceWord(Word word, Set attrsSet) { String form = word.getForm(); String accent = word.getPitchAccent(); if (accent != null && attrsSet.contains(Tokenizer.PITCH_ACCENT_ATTR)) accent = null; List> pairs = word.getAttrValPairsList(); if (pairs != null) { pairs = new ArrayList>(pairs); Iterator> pairsIt = pairs.iterator(); while (pairsIt.hasNext()) { Pair pair = pairsIt.next(); if (attrsSet.contains(pair.a)) { pairsIt.remove(); } } return createWord(form, accent, pairs, null, null, null, null); } else { return createWordDirectly(form, accent, null, null, null, null, null); } } /** Returns a hash code for this word. */ public int hashCode() { int hc = System.identityHashCode(getForm()); hc = 31*hc + System.identityHashCode(getPitchAccent()); for (Iterator> it = getAttrValPairs(); it.hasNext(); ) { Pair p = it.next(); hc = 31*hc + System.identityHashCode(p.a); hc = 31*hc + System.identityHashCode(p.b); } hc = 31*hc + System.identityHashCode(getStem()); hc = 31*hc + System.identityHashCode(getPOS()); hc = 31*hc + System.identityHashCode(getSupertag()); hc = 31*hc + System.identityHashCode(getSemClass()); return hc; } /** Returns whether this word equals the given object. 
*/ public boolean equals(Object obj) { if (this == obj) return true; // nb: can use ==, since constructor interns all factors if (!(obj instanceof Word)) return false; Word word = (Word) obj; boolean sameFields = getForm() == word.getForm() && getPitchAccent() == word.getPitchAccent() && getStem() == word.getStem() && getPOS() == word.getPOS() && getSupertag() == word.getSupertag() && getSemClass() == word.getSemClass(); if (!sameFields) return false; List> pairs = getAttrValPairsList(); List> wordPairs = word.getAttrValPairsList(); if (pairs == null && wordPairs == null) return true; if (pairs == null || wordPairs == null) return false; if (pairs.size() != wordPairs.size()) return false; for (int i = 0; i < pairs.size(); i++) { if (!pairs.get(i).equals(wordPairs.get(i))) return false; } return true; } /** Returns an int representing lexicographic sorting. */ public int compareTo(Word word) { if (this == word) return 0; int cmp = 0; cmp = compare(getForm(), word.getForm()); if (cmp != 0) return cmp; cmp = compare(getPitchAccent(), word.getPitchAccent()); if (cmp != 0) return cmp; cmp = compare(getStem(), word.getStem()); if (cmp != 0) return cmp; cmp = compare(getPOS(), word.getPOS()); if (cmp != 0) return cmp; cmp = compare(getSupertag(), word.getSupertag()); if (cmp != 0) return cmp; cmp = compare(getSemClass(), word.getSemClass()); if (cmp != 0) return cmp; List> pairs = getAttrValPairsList(); List> wordPairs = word.getAttrValPairsList(); if (pairs == null && wordPairs == null) return 0; if (pairs == null) return -1; if (wordPairs == null) return 1; if (pairs.size() < wordPairs.size()) return -1; if (pairs.size() > wordPairs.size()) return 1; for (int i = 0; i < pairs.size(); i++) { Pair p = pairs.get(i); Pair wp = wordPairs.get(i); cmp = p.a.compareTo(wp.a); if (cmp != 0) return cmp; cmp = p.b.compareTo(wp.b); if (cmp != 0) return cmp; } return 0; } // compares strings, accounting for nulls private int compare(String s1, String s2) { if (s1 == null && s2 == null) return 0; if (s1 == null) return -1; if (s2 == null) return 1; return s1.compareTo(s2); } /** Returns whether this word's surface attributes intersect with the given ones. */ public boolean attrsIntersect(Set attrsSet) { if (getPitchAccent() != null && attrsSet.contains(Tokenizer.PITCH_ACCENT_ATTR)) return true; for (Iterator> it = getAttrValPairs(); it.hasNext(); ) { Pair p = it.next(); if (attrsSet.contains(p.a)) return true; } return false; } /** Returns a hash code for this word's restriction to a surface word. */ public int surfaceWordHashCode() { int hc = System.identityHashCode(getForm()); hc = 31*hc + System.identityHashCode(getPitchAccent()); for (Iterator> it = getAttrValPairs(); it.hasNext(); ) { Pair p = it.next(); hc = 31*hc + System.identityHashCode(p.a); hc = 31*hc + System.identityHashCode(p.b); } return hc; } /** Returns whether this word and the given object have equal restrictions to surface words. 
*/ public boolean surfaceWordEquals(Object obj) { if (this == obj) return true; // nb: can use ==, since constructor interns all factors if (!(obj instanceof Word)) return false; Word word = (Word) obj; boolean sameFields = getForm() == word.getForm() && getPitchAccent() == word.getPitchAccent(); if (!sameFields) return false; List> pairs = getAttrValPairsList(); List> wordPairs = word.getAttrValPairsList(); if (pairs == null && wordPairs == null) return true; if (pairs == null || wordPairs == null) return false; if (pairs.size() != wordPairs.size()) return false; for (int i = 0; i < pairs.size(); i++) { if (!pairs.get(i).equals(wordPairs.get(i))) return false; } return true; } /** Returns canonical version of deserialized word. */ public Object readResolve() throws ObjectStreamException { return createWord(getForm(), getPitchAccent(), getAttrValPairsList(), getStem(), getPOS(), getSupertag(), getSemClass()); } /** Shows non-trivial fields separated by underscores. */ public String toString() { StringBuffer sb = new StringBuffer(); if (getForm() != null) sb.append(getForm()); if (getPitchAccent() != null) sb.append('_').append(getPitchAccent()); for (Iterator> it = getAttrValPairs(); it.hasNext(); ) { Pair p = it.next(); sb.append('_').append(p.b); } if (getStem() != null && getStem() != getForm()) sb.append('_').append(getStem()); if (getPOS() != null) sb.append('_').append(getPOS()); if (getSupertag() != null) sb.append('_').append(getSupertag()); if (getSemClass() != null) sb.append('_').append(getSemClass()); if (sb.length() == 0) sb.append((String)null); return sb.toString(); } /** Tests serialization. */ public static void main(String[] argv) throws IOException, ClassNotFoundException { // create words Word w = createWord("ran"); Word fw = createFullWord(w, "run", "VBD", "s\\np", "MOTION"); Word wb = createWordWithAttrs(w, createWord("B", "L")); // write to tmp.out String filename = "tmp.ser"; ObjectOutputStream out = new ObjectOutputStream(new FileOutputStream(filename)); System.out.println("Writing w: " + w); out.writeObject(w); System.out.println("Writing fw: " + fw); out.writeObject(fw); System.out.println("Writing wb: " + wb); out.writeObject(wb); out.close(); // read from tmp.out ObjectInputStream in = new ObjectInputStream(new FileInputStream(filename)); System.out.print("Reading w2: "); Word w2 = (Word) in.readObject(); System.out.println(w2); System.out.print("Reading fw2: "); Word fw2 = (Word) in.readObject(); System.out.println(fw2); System.out.print("Reading wb2: "); Word wb2 = (Word) in.readObject(); System.out.println(wb2); in.close(); // test identity (and thus readResolve) System.out.println("w == w2?: " + (w == w2)); System.out.println("fw == fw2?: " + (fw == fw2)); System.out.println("wb == wb2?: " + (wb == wb2)); } } ================================================ FILE: src/opennlp/ccg/lexicon/WordWithPitchAccent.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. 
See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.lexicon; /** * A WordWithPitchAccent object is a surface word with an optional pitch accent * but no further attributes. * * @author Michael White * @version $Revision: 1.4 $, $Date: 2009/07/17 04:23:30 $ */ public class WordWithPitchAccent extends SimpleWord { private static final long serialVersionUID = 1510997962756436949L; /** The pitch accent. */ protected String pitchAccent; /** Returns the pitch accent. */ public String getPitchAccent() { return pitchAccent; } /** Constructor. */ protected WordWithPitchAccent(String form, String pitchAccent) { super(form); this.pitchAccent = pitchAccent; } } ================================================ FILE: src/opennlp/ccg/ngrams/AAnFilter.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.ngrams; import opennlp.ccg.lexicon.*; import opennlp.ccg.util.*; import java.util.*; import java.io.*; import gnu.trove.*; /** * AN n-gram filter that detects "a" followed by a word beginning with a vowel, * or "an" followed by a word beginning with a consonant. * Note that this filter only makes an approximate check, which may be augmented * with a set of exceptions. * Exceptions may be culled from a file of bigrams using cullAAnExceptions, * which may be accessed from the command line using the -c option. * An appropriate bigrams file can be produced using the SRILM ngram-count tool, * with the -text and -write2 options. * * @author Michael White * @version $Revision: 1.8 $, $Date: 2011/03/20 20:11:58 $ */ public class AAnFilter implements NgramFilter, Reversible { // exceptions private Set> exceptions = null; /** Constructor. */ public AAnFilter() {} /** Constructor that loads a/an exceptions from the given infile of bigrams. */ public AAnFilter(String infile) throws IOException { loadAAnExceptions(infile); } /** Flag for whether to reverse words before filtering. */ protected boolean reverse = false; /** Get reverse flag. */ public boolean getReverse() { return reverse; } /** Set reverse flag. */ public void setReverse(boolean reverse) { this.reverse = reverse; } /** Returns whether to filter out the given word sequence. 
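 *
 * <p>Illustrative usage sketch, as in the {@code main} test below (the exceptions
 * file is optional and its name here is hypothetical):
 * <pre>{@code
 * AAnFilter filter = new AAnFilter();  // or new AAnFilter("aan-exceptions.txt")
 * List<Word> words = new DefaultTokenizer().tokenize("she ate a apple");
 * boolean bad = filter.filterOut(words);  // true: "a" precedes a vowel-initial word
 * }</pre>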
*/ public boolean filterOut(List words) { for (int i = 0; i < words.size()-1; i++) { Word w1 = words.get(i); Word w2 = words.get(i+1); if (filterOut(w1, w2)) return true; } return false; } /** Returns whether to filter out the given word bigram (reversed if apropos). */ public boolean filterOut(Word w1, Word w2) { if (reverse) { Word tmp = w1; w1 = w2; w2 = tmp; } String f1 = w1.getForm(); if (f1 != "a" && f1 != "an") return false; String f1Alt = (f1 == "a") ? "an" : "a"; String f2 = w2.getForm(); boolean defaultRetval = filterOutByDefault(f1, f2); if (isException(f1, f2) || isException(f1Alt, f2)) return !defaultRetval; else return defaultRetval; } // returns whether to filter out the bigram by default private static boolean filterOutByDefault(String w1, String w2) { boolean w2StartsWithVowel = startsWithVowel(w2); return (w1 == "a" && w2StartsWithVowel) || (w1 == "an" && !w2StartsWithVowel); } // initial vowel private static boolean startsWithVowel(String word) { char c = word.charAt(0); return (c == 'a' || c == 'e' || c == 'i' || c == 'o' || c == 'u') || (c == 'A' || c == 'E' || c == 'I' || c == 'O' || c == 'U'); } // words for a/an private static final Word A_WORD = Word.createWord("a"); private static final Word AN_WORD = Word.createWord("an"); // reusable list for lookup private List keyList = new ArrayListWithIdentityEquals(2); // looks up whether the bigram is an exception private boolean isException(String w1, String w2) { if (exceptions == null) return false; keyList.clear(); keyList.add((w1 == "a") ? A_WORD : AN_WORD); keyList.add(Word.createWord(w2)); return exceptions.contains(keyList); } // singletons for a/an @SuppressWarnings("unchecked") private static final List A_SINGLETON = (List) Interner.globalIntern(new SingletonList(A_WORD)); @SuppressWarnings("unchecked") private static final List AN_SINGLETON = (List) Interner.globalIntern(new SingletonList(AN_WORD)); /** Adds an a/an bigram as an exception. */ @SuppressWarnings("unchecked") public void addException(String w1, String w2) { // make sure w1 is a/an w1 = w1.intern(); if (w1 != "a" && w1 != "an") { System.err.println("Warning: ignoring exception not starting with a/an: " + w1 + " " + w2); return; } // ensure exceptions initialized if (exceptions == null) exceptions = new THashSet(); // intern and add bigram List w1Singleton = (w1 == "a") ? A_SINGLETON : AN_SINGLETON; List w2Singleton = (List) Interner.globalIntern(new SingletonList(Word.createWord(w2))); List excBigram = (List) Interner.globalIntern(new StructureSharingList(w1Singleton, w2Singleton)); exceptions.add(excBigram); } /** Culls a/an exceptions from the given infile of bigrams, writing them to the given outfile. */ public static void cullAAnExceptions(String infile, String outfile) throws IOException { Reader in = new BufferedReader(new FileReader(infile)); StreamTokenizer tokenizer = NgramScorer.initTokenizer(in); PrintWriter out = new PrintWriter(new FileWriter(outfile)); String[] tokens = new String[2]; // loop through lines while (tokenizer.ttype != StreamTokenizer.TT_EOF) { // read line into tokens NgramScorer.readLine(tokenizer, tokens); // check for blank/incomplete line if (tokens[1] == null) continue; // check for a/an exception if (tokens[0].equals("a") || tokens[0].equals("an")) { String aan = tokens[0].intern(); String word = tokens[1]; if (filterOutByDefault(aan, word)) { // write to exceptions file out.println(aan + " " + word); } } } // done in.close(); out.flush(); out.close(); } /** Loads a/an exceptions from the given infile of bigrams. 
*/ public void loadAAnExceptions(String infile) throws IOException { Reader in = new BufferedReader(new FileReader(infile)); StreamTokenizer tokenizer = NgramScorer.initTokenizer(in); String[] tokens = new String[2]; // loop through lines while (tokenizer.ttype != StreamTokenizer.TT_EOF) { // read line into tokens NgramScorer.readLine(tokenizer, tokens); // check for blank/incomplete line if (tokens[1] == null) continue; // add a/an exception addException(tokens[0], tokens[1]); } // done in.close(); } /** Test loading and filtering, or cull exceptions from bigrams. */ public static void main(String[] args) throws IOException { String usage = "Usage: java opennlp.ccg.ngrams.AAnFilter () | -c "; if (args.length > 0 && args[0].equals("-h")) { System.out.println(usage); System.exit(0); } // cull exceptions with -c if (args[0].equals("-c")) { String infile = args[1]; String outfile = args[2]; System.out.println("Culling a/an exceptions from " + infile + " to " + outfile); cullAAnExceptions(infile, outfile); System.exit(0); } // otherwise optionally load exceptions, ... AAnFilter aanFilter = new AAnFilter(); String infile = null; String tokens = null; if (args.length >= 2) { infile = args[0]; tokens = args[1]; } else tokens = args[0]; if (infile != null) { System.out.println("Loading exceptions from: " + infile); System.out.println(); aanFilter.loadAAnExceptions(infile); } // then filter given tokens Tokenizer tokenizer = new DefaultTokenizer(); List words = tokenizer.tokenize(tokens); //, true); System.out.println("filtering: " + tokens); System.out.println("filter out: " + aanFilter.filterOut(words)); } } ================================================ FILE: src/opennlp/ccg/ngrams/AbstractStandardNgramModel.java ================================================ /* * $Id: AbstractStandardNgramModel.java,v 1.3 2009/12/21 03:27:18 mwhite14850 Exp $ */ package opennlp.ccg.ngrams; import java.util.ArrayList; import java.util.Iterator; import java.util.List; import opennlp.ccg.lexicon.Word; import opennlp.ccg.util.Pair; /** * Abstract class for shared methods used by all standard ngram models. * Adapted from the original StandardNgramModel class. * * @author Scott Martin * @version $Revision: 1.3 $ * @since 0.9.2 */ abstract class AbstractStandardNgramModel extends NgramScorer { /** Reusable list of strings to score. */ protected List stringsToScore = new ArrayList(); /** * Creates a new ngram model of the given order. * @param order The order of the model. * @param useSemClasses Whether this model should use semantic classes. * @see NgramScorer#NgramScorer(int, boolean) */ protected AbstractStandardNgramModel(int order, boolean useSemClasses) { super(order, useSemClasses); numNgrams = new int[order]; } /** * Creates a new ngram model with the specified order. * @see AbstractStandardNgramModel#AbstractStandardNgramModel(int, boolean) */ protected AbstractStandardNgramModel(int order) { this(order, false); } /** * Converts the words in wordsToScore to strings in stringsToScore, before * scoring. 
 */
    @Override
    protected void prepareToScoreWords() {
        stringsToScore.clear();
        for (int i = 0; i < wordsToScore.size(); i++) {
            Word w = wordsToScore.get(i);
            String s = w.getForm();
            // check for sem class replacement
            String scr = semClassReplacement(w);
            if (scr != null) s = scr;
            // add pitch accent and attrs, if any
            String pitchAccent = w.getPitchAccent();
            Iterator<Pair<String,String>> pairs = w.getAttrValPairs();
            if (pitchAccent != null || pairs.hasNext()) {
                StringBuffer sb = new StringBuffer();
                sb.append(s);
                if (pitchAccent != null) sb.append('_').append(pitchAccent);
                for (; pairs.hasNext(); ) {
                    Pair<String,String> p = pairs.next();
                    sb.append('_').append(p.b);
                }
                s = sb.toString().intern();
            }
            // check for unknown word
            if (openVocab && trieMapRoot.getChild(s) == null) s = "<unk>";
            // add key
            stringsToScore.add(s);
        }
    }

    /**
     * Returns the log prob of the ngram starting at the given index
     * in wordsToScore and with the given order, with backoff.
     * (Assumes words in wordsToScore have already been converted to strings in
     * stringsToScore, via call to prepareToScoreWords.)
     */
    @Override
    protected float logProbFromNgram(int i, int order) {
        // skip initial start tag
        if (i == 0 && order == 1 && stringsToScore.get(0) == "<s>") return 0;
        // set keys list
        keysList.clear();
        for (int j = i; j < i+order; j++) {
            keysList.add(stringsToScore.get(j));
        }
        if (debugScore) {
            System.out.print("logp( " + keysList.get(order-1) + " | ");
            if (order > 1) { System.out.print(keysList.get(order-2) + " ... "); }
            System.out.print(") = ");
        }
        // calc log prob
        float retval = logProb(0, order);
        if (debugScore) System.out.println("" + retval);
        return retval;
    }
}


================================================
FILE: src/opennlp/ccg/ngrams/ConditionalProbabilityTable.java
================================================
///////////////////////////////////////////////////////////////////////////////
// Copyright (C) 2010 Michael White
//
// This library is free software; you can redistribute it and/or
// modify it under the terms of the GNU Lesser General Public
// License as published by the Free Software Foundation; either
// version 2.1 of the License, or (at your option) any later version.
//
// This library is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
// GNU Lesser General Public License for more details.
//
// You should have received a copy of the GNU Lesser General Public
// License along with this program; if not, write to the Free Software
// Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
//////////////////////////////////////////////////////////////////////////////

package opennlp.ccg.ngrams;

import java.io.IOException;
import java.util.*;

import opennlp.ccg.lexicon.*;
import opennlp.ccg.util.*;

/**
 * A conditional probability table implemented via a FactoredNgramModelFamily,
 * where probabilities are determined by n-grams of "factors" of a single "word"
 * (whether the pairs of attributes and values have anything to do with words
 * or not).
 *
 * @author  Michael White
 * @version $Revision: 1.2 $, $Date: 2010/02/25 22:26:10 $
 */
public class ConditionalProbabilityTable {

    /**
     * The model, as a factored n-gram model family.
     */
    protected FactoredNgramModelFamily model;

    /**
     * Constructor with filename for model as a factored n-gram model family.
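 *
 * <p>Illustrative usage sketch: scoring a list of attribute-value pairs against a
 * table loaded from a hypothetical specification file, as in {@code main} below
 * (attributes and values are assumed to have been interned):
 * <pre>{@code
 * ConditionalProbabilityTable table = new ConditionalProbabilityTable("flm/table.flm");
 * List<Pair<String,String>> pairs = new ArrayList<Pair<String,String>>();
 * pairs.add(new Pair<String,String>("P".intern(), "VBD".intern()));
 * pairs.add(new Pair<String,String>("W".intern(), "ran".intern()));
 * double logprob = table.logprob(pairs);
 * }</pre>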
*/ public ConditionalProbabilityTable(String filename) throws IOException { model = new FactoredNgramModelFamily(filename, false); if (model.order != 1) { throw new RuntimeException("A conditional probability table must have n-gram order 1."); } } /** Sets the debug score flag. */ public void setDebug(boolean debugScore) { model.setDebug(debugScore); } /** * Returns a probability from the model for the given list of attribute-value * pairs, which are assumed to have already been interned, by converting * the result of the logprob method. */ public double score(List> attrValList) { return NgramScorer.convertToProb(logprob(attrValList)); } /** * Returns a log probability from the model for the given list of attribute-value * pairs, which are assumed to have already been interned. * The order of the list does not matter because the model probabilities are * defined by the factored n-gram model family specification. */ public double logprob(List> attrValList) { return model.logprob(new SingletonList(new ListPairWord(attrValList))); } /** Tests loading and scoring. */ public static void main(String[] args) throws IOException { String usage = "Usage: java opennlp.ccg.ngrams.ConditionalProbabilityTable "; if (args.length > 0 && args[0].equals("-h")) { System.out.println(usage); System.exit(0); } String specfile = args[0]; String tokens = args[1]; List> pairs = new ArrayList>(); String[] tokenArray = tokens.split("\\s+"); for (int i=0; i < tokenArray.length; i+=2) { String attr = tokenArray[i].intern(); String val = tokenArray[i+1].intern(); pairs.add(new Pair(attr, val)); } System.out.println("Loading conditional probability table from: " + specfile); ConditionalProbabilityTable table = new ConditionalProbabilityTable(specfile); FactoredNgramModelFamily lmFamily = table.model; System.out.println("primary child var: " + lmFamily.primaryGroup.childName); if (lmFamily.furtherGroups != null) { for (int i = 0; i < lmFamily.furtherGroups.length; i++) { System.out.println("further child var: " + lmFamily.furtherGroups[i].childName); } } System.out.println("openVocab: " + lmFamily.openVocab); System.out.println(); System.out.println("scoring: " + tokens); System.out.println(); table.setDebug(true); double logprob = table.logprob(pairs); double score = NgramScorer.convertToProb(logprob); System.out.println("score: " + score); System.out.println("logprob: " + logprob); } } ================================================ FILE: src/opennlp/ccg/ngrams/FactoredNgramModel.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004-5 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.ngrams; import opennlp.ccg.lexicon.*; import opennlp.ccg.util.*; import java.util.*; import java.io.*; /** * A scorer for a factored n-gram backoff model. * The file format is the one generated by the SRILM version 1.4.1 fngram-count tool. * Only static backoff orders are supported at present, with * the most distant parent variable dropped at each backoff point. * Unknown words/factors are mapped to <unk> if the latter is present in * the model. * * @author Michael White * @version $Revision: 1.22 $, $Date: 2011/10/11 03:29:42 $ */ public class FactoredNgramModel extends NgramScorer { /** Map for caching and reusing individual models by filename. */ public static Map modelCache = new HashMap(); /** The variable to predict. */ public final ModelVariable child; /** The parent variables to condition on, backing off from the end. */ public final ModelVariable[] parents; /** A variable in a factored n-gram model. */ public class ModelVariable { /** The variable name. */ public final String name; /** The (absolute value of the) position in the history. */ public final int position; /** Makes a model variable from a string such as "W" or "W(-1)". */ public ModelVariable(String str) { int leftparen = str.indexOf("("); if (leftparen > 0) { name = str.substring(0,leftparen).intern(); int rightparen = str.indexOf(")"); position = Math.abs(Integer.parseInt(str.substring(leftparen+1,rightparen))); } else { name = str.intern(); position = 0; } } } /** * Loads a factored n-gram model for the given child variable, with the given parent variables, * from the file with the given name, in the SRILM format. * The flag for using sem classes is defaulted to true. */ public FactoredNgramModel(String child, String parents[], String filename) throws IOException { this(child, parents, filename, true); } /** * Loads a factored n-gram model for the given child variable, with the given parent variables, * from the file with the given name, in the SRILM format, * and with the given flag for using sem classes. */ public FactoredNgramModel(String child, String parents[], String filename, boolean useSemClasses) throws IOException { this.useSemClasses = useSemClasses; this.child = new ModelVariable(child); this.parents = new ModelVariable[parents.length]; order = 1; for (int i = 0; i < parents.length; i++) { this.parents[i] = new ModelVariable(parents[i]); order = Math.max(order, this.parents[i].position + 1); } this.numNgrams = new int[(int)Math.pow(2, parents.length)]; // check cache FactoredNgramModel cachedModel = modelCache.get(filename); if (cachedModel != null) { // share trie etc. numNgrams = cachedModel.numNgrams; openVocab = cachedModel.openVocab; trieMapRoot = cachedModel.trieMapRoot; cachedLogProbs = cachedModel.cachedLogProbs; } // otherwise load model else { Reader in = new BufferedReader(new FileReader(filename)); readModel(in); modelCache.put(filename, this); } } /** * Returns a list of feature keys for the ngram starting at the given index in * wordsToScore and with the given order, using the keys in keysList after * setting them appropriately with setKeysToNgram; returns null if this * operation does not succeed normally. With factored models, factor keys * are sequenced as two string keys. 
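 *
 * <p>Illustrative usage sketch: loading and scoring a factored model, following the
 * {@code main} test at the end of this class (the model file name is hypothetical):
 * <pre>{@code
 * String[] parents = { "W(-1)", "W(-2)" };
 * FactoredNgramModel lm = new FactoredNgramModel("W", parents, "flm/word.flm", true);
 * List<Word> words = new DefaultTokenizer().tokenize("<s> he ran </s>", true);
 * lm.setWordsToScore(words, true);
 * lm.prepareToScoreWords();
 * double logprob = lm.logprob();
 * }</pre>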
*/ protected List ngram(int i, int order) { boolean ok = setKeysToNgram(i, order); if (!ok) return null; featureKeysList.clear(); for (int j=0; j < keysList.size(); j++) { Object key = keysList.get(j); if (key instanceof String) { featureKeysList.add(Tokenizer.WORD_ATTR); featureKeysList.add((String)key); } else if (!(key instanceof FactorKey)) { throw new RuntimeException("Factor keys expected here! key: " + key); } else { FactorKey fkey = (FactorKey) key; featureKeysList.add(fkey.factor); featureKeysList.add(fkey.val); } } return featureKeysList; } /** Returns the log prob of the ngram starting at the given index in wordsToScore and with the given order, with backoff. If using sem classes, then words with replacement sem classes are mapped to words with the sem class replacing the form and stem. Any remaining unknown words/factors are mapped to <unk>, if the latter is present in the model. */ // extracts factor keys from full words according to parents list, // then determines log prob from the list of factor keys protected float logProbFromNgram(int i, int order) { // skip initial start tag if (i == 0 && order == 1 && ((Word)wordsToScore.get(0)).getForm() == "") return 0; // set up factor keys keysList.clear(); int i0 = i + order-1; // index of current word // determine last available parent, if full context not available int lastParentIndex = parents.length-1; if (this.order > order) { for (int j = 0; j < parents.length; j++) { if (parents[j].position >= order) { lastParentIndex = j-1; break; } } } // go through parents in reverse order, // extracting and adding factor keys for (int j = lastParentIndex; j >= 0; j--) { int pos_j = i0 - parents[j].position; if (pos_j < i) continue; // skip if pos_j past i Word w = (Word) wordsToScore.get(pos_j); keysList.add(makeFactorKey(w, parents[j].name)); } // add factor key for child Word current = (Word) wordsToScore.get(i0); keysList.add(makeFactorKey(current, child.name)); if (debugScore) { System.out.print("logp( " + keysList.get(keysList.size()-1) + " | "); for (int j = keysList.size()-2; j >= 0; j--) { System.out.print(keysList.get(j) + " "); } System.out.print(") = "); } // calc log prob from factor keys float retval = logProb(0, keysList.size()); // NB: workaround for apparent bug in SRILM 1.4.1 fngram-count tool, // whereby prob for does not use higher-order contexts for // factors other than W: just use zero if (current.getForm() == "" && child.name != "W") retval = 0; if (debugScore) System.out.println("" + retval); return retval; } // makes a factor key from the given word by extracting // the attribute with the given name, where // the delimiter tokens are treated as a special case, // and the attr val is adjusted if using sem classes private Object makeFactorKey(Word w, String attr) { // special cases for and : just return // a word with this form, regardless of the attr String form = w.getForm(); if (form == "" || form == "") { return FactorKey.getKey(attr, form); } // get val for this attr String val = w.getVal(attr); // check for sem class replacement for form or stem if (attr == Tokenizer.WORD_ATTR || attr == Tokenizer.STEM_ATTR) { String scr = semClassReplacement(w); if (scr != null) val = scr; } // make factor key Object retval = FactorKey.getKey(attr, val); // check for unknown val if (openVocab && trieMapRoot.getChild(retval) == null) { val = ""; retval = FactorKey.getKey(attr, val); } // return return retval; } // reads in model private void readModel(Reader in) throws IOException { // setup //Tokenizer wordTokenizer = 
(Grammar.theGrammar != null) // ? Grammar.theGrammar.lexicon.tokenizer // : new DefaultTokenizer(); StreamTokenizer tokenizer = initTokenizer(in); String[] tokens = new String[parents.length+3]; Object[] factorKeys = new Object[parents.length+1]; boolean foundData = false; int numParents = -1; int parentsInt = -1; List currentPrefix = new ArrayList(); List currentKeys = null; List> currentChildren = null; // loop through lines while (tokenizer.ttype != StreamTokenizer.TT_EOF) { // read line into tokens readLine(tokenizer, tokens); // check for blank line if (tokens[0] == null) continue; // check for initial delimiter if (tokens[0].equals("\\data\\")) { foundData = true; continue; } if (!foundData) continue; // read header line if (tokens[0].equals("ngram")) { int equalPos = tokens[1].indexOf("="); int n = Integer.decode(tokens[1].substring(0,equalPos)).intValue(); int total = Integer.parseInt(tokens[1].substring(equalPos+1)); numNgrams[n] = total; // init children, keys lists if (currentChildren == null) { currentChildren = new ArrayList>(total); currentKeys = new ArrayList(total); } // calc totals (not actually used anymore) if (n == numNgrams.length-1) { @SuppressWarnings("unused") int totalNgrams = 0; for (int i = 0; i < numNgrams.length; i++) { totalNgrams += numNgrams[i]; } // System.out.println("totalNgrams: " + totalNgrams); } continue; } // check for final delimiter if (tokens[0].equals("\\end\\")) { addTrieMapChildren(currentPrefix, currentKeys, currentChildren); break; } // read line starting new parents context int gramsPos = -1; if (tokens[0].startsWith("\\") && (gramsPos = tokens[0].indexOf("-grams:")) > 0) { // add current children addTrieMapChildren(currentPrefix, currentKeys, currentChildren); // update num parents // System.out.println(tokens[0]); parentsInt = Integer.decode(tokens[0].substring(1,gramsPos)).intValue(); numParents = numParents(parentsInt); continue; } if (numParents < 0) continue; // current order is num parents plus one for child var int currentOrder = numParents + 1; // parse a line of the form // ... [] // i.e. a log prob, followed by N vars, a child var, and an optional back off weight // NB: unlike the ARPA format, here the here is // associated with the backoff of ... // rather than context consisting of ... // read logprob float logprob = Float.parseFloat(tokens[0]); // unescape, intern factor keys for (int i = 1; i < currentOrder+1; i++) { String attr = (i == currentOrder) ? 
child.name : parents[(currentOrder-i)-1].name; String val = tokens[i]; int hyphenPos = val.indexOf('-'); if (hyphenPos > 0) { String attrCheck = val.substring(0, hyphenPos).intern(); if (attr != attrCheck) { System.err.println( "Warning: expected attr " + attr + " rather than " + attrCheck + " in " + tokens[i] ); } val = val.substring(hyphenPos+1); } val = DefaultTokenizer.unescape(val); if (val != null) val = val.intern(); factorKeys[i-1] = FactorKey.getKey(attr, val); } // check prefix boolean samePrefix = (currentPrefix.size() == currentOrder-1); for (int i = 0; samePrefix && i < currentOrder-1; i++) { if (factorKeys[i] != currentPrefix.get(i)) samePrefix = false; } // if changed, add current children, reset prefix if (!samePrefix) { addTrieMapChildren(currentPrefix, currentKeys, currentChildren); for (int i = 0; i < currentOrder-1; i++) { currentPrefix.add(factorKeys[i]); } } Object key = factorKeys[currentOrder-1]; currentKeys.add(key); currentChildren.add(new TrieMap(new NgramFloats(logprob, 0))); // read back-off weight, if present if (tokens[currentOrder+1] != null) { float bow = Float.parseFloat(tokens[currentOrder+1]); // add to prefix node TrieMap prefixNode = trieMapRoot.findChildFromList(currentPrefix); NgramFloats nfloats = prefixNode.data; if (nfloats != null) nfloats.bow = bow; else prefixNode.data = new NgramFloats(0, bow); } } // set openVocab according to presence of child Object unkKey = FactorKey.getKey(child.name,""); openVocab = (trieMapRoot.getChild(unkKey) != null); } // returns the number of parents present in the parentsInt spec private int numParents(int parentsInt) { int retval = 0; for (int i = 0; i < parents.length; i++) { if ((parentsInt & 1) != 0) retval++; parentsInt = parentsInt >> 1; } return retval; } /** Test loading and scoring. */ // NB: This produces the same scores as the SRILM fngram tool when both // and tags are used, except that ... // NB: There is a workaround for an apparent bug in SRILM 1.4.1 fngram-count tool, // whereby prob for does not use higher-order contexts for // factors other than W, and thus a log prob of zero is just used instead. 
public static void main(String[] args) throws IOException { String usage = "Usage: java opennlp.ccg.ngrams.FactoredNgramModel "; if (args.length > 0 && args[0].equals("-h")) { System.out.println(usage); System.exit(0); } String child = args[0]; String[] parents = args[1].split("\\s+"); String lmfile = args[2]; String tokens = args[3]; System.out.println("Loading n-gram model from: " + lmfile); FactoredNgramModel lm = new FactoredNgramModel(child, parents, lmfile, true); System.out.println("child var: " + lm.child.name); for (int i = 0; i < lm.parents.length; i++) { System.out.println("parent var: (" + lm.parents[i].name + "," + lm.parents[i].position + ")"); } System.out.println("order: " + lm.order); System.out.println("openVocab: " + lm.openVocab); System.out.println(); // System.out.println("trie map: "); // System.out.println(lm.trieMapRoot.toString()); // System.out.println(); Tokenizer tokenizer = new DefaultTokenizer(); List words = tokenizer.tokenize(tokens, true); System.out.println("scoring: "); for (int i = 0; i < words.size(); i++) { System.out.println(words.get(i).toString()); } System.out.println(); lm.debugScore = true; lm.setWordsToScore(words, true); lm.prepareToScoreWords(); double logprob = lm.logprob(); double score = convertToProb(logprob); System.out.println(); System.out.println("score: " + score); System.out.println("logprob: " + logprob); System.out.println("ppl: " + NgramScorer.convertToPPL(logprob / (words.size()-1))); } } ================================================ FILE: src/opennlp/ccg/ngrams/FactoredNgramModelFamily.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004-5 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.ngrams; import opennlp.ccg.lexicon.*; import opennlp.ccg.perceptron.Alphabet; import opennlp.ccg.perceptron.FeatureMap; import java.util.*; import java.io.*; /** * A scorer consisting of a family of factored n-gram backoff models. * The family of models is specified using the factored language model specification * file format given as input to the SRILM version 1.4.1 fngram-count tool. * Each individual model is loaded as a FactoredNgramModel instance, and thus * only static backoff orders are supported at present, with * the most distant parent variable dropped at each backoff point. * The first model in the specification file should be the primary one. * It may be followed by any number of models for the same child variable * but with lower history orders; these models will be used when the * full history is unavailable, if their order matches the available * number of words in the history. 
For example, if the primary model is * a trigram model, then a bigram model may also be given (with a potentially * different backoff order) for scoring bigram word sequences. * Following these models, there may also be further (sequences of) models for scoring * different child variables. If present, the scores calculated for these * child variables will be multipled with the score calculated for the primary * model's child variable (typically the word form). For example, one or more * models may be given to calculate the probability of the word's pitch accent, * independently of the word form (though potentially looking at some of the same history). * With each individual model, the parents are assumed to be listed in backoff order. * Unknown words are mapped to <unk> if the latter is present in * the first model. * * @author Michael White * @version $Revision: 1.15 $, $Date: 2010/02/25 22:26:11 $ */ public class FactoredNgramModelFamily extends NgramScorer { /** The primary model group. */ public final ModelGroup primaryGroup; /** Any additional model groups, for different child variables. */ public final ModelGroup[] furtherGroups; /** A factored n-gram model and any secondary ones for the same child variable. */ public class ModelGroup { /** The child variable name. */ public final String childName; /** The primary model. */ public final FactoredNgramModel primaryModel; /** The secondary models. */ public final FactoredNgramModel[] secondaryModels; /** Makes a model group from the given primary model. */ public ModelGroup(FactoredNgramModel primaryModel, FactoredNgramModel[] secondaryModels) { this.childName = primaryModel.child.name; this.primaryModel = primaryModel; this.secondaryModels = secondaryModels; } /** Returns the appropriate model for the given order. */ public FactoredNgramModel getModel(int order) { if (secondaryModels == null) return primaryModel; for (int i = 0; i < secondaryModels.length; i++) { if (secondaryModels[i].order == order) return secondaryModels[i]; } return primaryModel; } /** Propagates the reverse flag. */ public void setReverse(boolean reverse) { primaryModel.setReverse(reverse); if (secondaryModels == null) return; for (int i = 0; i < secondaryModels.length; i++) { secondaryModels[i].setReverse(reverse); } } /** Propagates the debug score flag. */ public void setDebug(boolean debugScore) { primaryModel.setDebug(debugScore); if (secondaryModels == null) return; for (int i = 0; i < secondaryModels.length; i++) { secondaryModels[i].setDebug(debugScore); } } /** Propagates wordsToScore to the given list, for sharing purposes. */ protected void shareWordsToScore(List wordsToScore) { primaryModel.shareWordsToScore(wordsToScore); if (secondaryModels == null) return; for (int i = 0; i < secondaryModels.length; i++) { secondaryModels[i].shareWordsToScore(wordsToScore); } } /** Sets the alphabet. */ public void setAlphabet(Alphabet alphabet) { primaryModel.setAlphabet(alphabet); if (secondaryModels == null) return; for (int i = 0; i < secondaryModels.length; i++) { secondaryModels[i].setAlphabet(alphabet); } } } /** * Loads a family of factored n-gram models * from the file with the given name, in the SRILM format. * The flag for using sem classes is defaulted to true. */ public FactoredNgramModelFamily(String filename) throws IOException { this(filename, true); } /** * Loads a family of factored n-gram models * from the file with the given name, in the SRILM format, * and with the given flag for using sem classes. 
*/ public FactoredNgramModelFamily(String filename, boolean useSemClasses) throws IOException { this.useSemClasses = useSemClasses; List modelGroups = readModel(filename); this.primaryGroup = modelGroups.get(0); if (modelGroups.size() == 1) this.furtherGroups = null; else { this.furtherGroups = new ModelGroup[modelGroups.size()-1]; for (int i = 1; i < modelGroups.size(); i++) { this.furtherGroups[i-1] = modelGroups.get(i); } } order = primaryGroup.primaryModel.order; openVocab = primaryGroup.primaryModel.openVocab; } /** Sets reverse flag, and propagates to component models. */ public void setReverse(boolean reverse) { super.setReverse(reverse); primaryGroup.setReverse(reverse); if (furtherGroups == null) return; for (int i = 0; i < furtherGroups.length; i++) { furtherGroups[i].setReverse(reverse); } } /** Sets debug score flag, and propagates to component models. */ public void setDebug(boolean debugScore) { super.setDebug(debugScore); primaryGroup.setDebug(debugScore); if (furtherGroups == null) return; for (int i = 0; i < furtherGroups.length; i++) { furtherGroups[i].setDebug(debugScore); } } /** Sets wordsToScore to the given list, for sharing purposes. */ protected void shareWordsToScore(List wordsToScore) { this.wordsToScore = wordsToScore; primaryGroup.shareWordsToScore(wordsToScore); if (furtherGroups == null) return; for (int i = 0; i < furtherGroups.length; i++) { furtherGroups[i].shareWordsToScore(wordsToScore); } } /** Sets the alphabet. */ public void setAlphabet(Alphabet alphabet) { super.setAlphabet(alphabet); primaryGroup.setAlphabet(alphabet); if (furtherGroups == null) return; for (int i = 0; i < furtherGroups.length; i++) { furtherGroups[i].setAlphabet(alphabet); } } /** * Increments ngram counts for the ngrams starting at the given index in * wordsToScore and with the given order. */ protected void incNgrams(FeatureMap featmap, int i, int order) { // do primary group List ngram = ngram(primaryGroup, i, order); if (ngram != null) { Alphabet.Feature f = alphabet.index(ngram); if (f != null) featmap.inc(f); } // then any further ones if (furtherGroups != null) { for (int j = 0; j < furtherGroups.length; j++) { List ngram2 = ngram(furtherGroups[j], i, order); if (ngram2 == null) continue; Alphabet.Feature f2 = alphabet.index(ngram2); if (f2 != null) featmap.inc(f2); } } } // get ngram from a model group private List ngram(ModelGroup modelGroup, int i, int order) { FactoredNgramModel modelToUse = modelGroup.primaryModel; // with less than full history, get possibly different model to use if (order < modelToUse.order) { modelToUse = modelGroup.getModel(order); } return modelToUse.ngram(i, order); } /** Returns the log prob of the ngram starting at the given index in wordsToScore and with the given order, with backoff. 
*/ protected float logProbFromNgram(int i, int order) { float logProbTotal = 0; // do primary group logProbTotal += logProbFromNgram(primaryGroup, i, order); // then any further ones if (furtherGroups != null) { for (int j = 0; j < furtherGroups.length; j++) logProbTotal += logProbFromNgram(furtherGroups[j], i, order); } return logProbTotal; } // calculate the log prob from a model group private float logProbFromNgram(ModelGroup modelGroup, int i, int order) { FactoredNgramModel modelToUse = modelGroup.primaryModel; // with less than full history, get possibly different model to use if (order < modelToUse.order) { modelToUse = modelGroup.getModel(order); if (debugScore && modelToUse != modelGroup.primaryModel) { int modelNum = Arrays.asList(modelGroup.secondaryModels).indexOf(modelToUse); System.out.print("[2ndary model " + modelNum + "] "); } } return modelToUse.logProbFromNgram(i, order); } /** The max number of tokens to allow per line in the spec file. */ public static int MAX_TOKENS_PER_LINE = 64; // reads in model, returning model groups private List readModel(String filename) throws IOException { // setup File infile = new File(filename); Reader in = new BufferedReader(new FileReader(infile)); StreamTokenizer tokenizer = initTokenizer(in); String[] tokens = new String[MAX_TOKENS_PER_LINE]; // read in models FactoredNgramModel[] models = null; int numModels = -1; int currentModel = 0; // loop through lines while (tokenizer.ttype != StreamTokenizer.TT_EOF) { // read line into tokens readLine(tokenizer, tokens); // check for blank line if (tokens[0] == null) continue; // check for comment if (tokens[0].charAt(0) == '#') continue; // read num models, if not yet found if (numModels < 0) { numModels = Integer.parseInt(tokens[0]); models = new FactoredNgramModel[numModels]; continue; } // skip rest if already read in numModels if (currentModel >= numModels) break; // read model spec if second token is a colon // line format is : ... 
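// Editor's note (illustrative, not in the original source): given the token positions read
// below, a spec file is laid out roughly as
//
//   # comment lines start with '#'
//   2                                    <- number of models (first non-comment line)
//   W : 2 P(-1) W(-1) w.count w.flm      <- child : numParents parent... countFile lmFile
//   W : 1 W(-1) w2.count w2.flm          <- lower-order model for the same child
//
// The parent specifiers, counts and file names shown are placeholders; the count file token
// is skipped, and the LM file path is resolved relative to the spec file's directory.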
if (tokens[1] != null && tokens[1].equals(":")) { // read child String child = tokens[0]; // read parents int numParents = Integer.parseInt(tokens[2]); String[] parents = new String[numParents]; for (int i = 0; i < numParents; i++) parents[i] = tokens[i+3]; // read lm filename (skipping count file name) String lmfn = tokens[numParents+4]; // make filename relative to spec file dir File lmfile = new File(infile.getParentFile(), lmfn); lmfn = lmfile.getPath(); // load current model models[currentModel] = new FactoredNgramModel(child, parents, lmfn, useSemClasses); // share wordsToScore models[currentModel].shareWordsToScore(wordsToScore); // inc current model currentModel++; } } // ensure models found if (models == null) { throw new IOException("No models found in: " + filename); } // check num models int actualNumModels = 0; for (int i = 0; i < numModels; i++) { if (models[i] != null) actualNumModels++; } if (actualNumModels != numModels) { System.err.println("Warning: Only found " + actualNumModels + "/" + numModels + " in " + filename); numModels = actualNumModels; } // assign models to groups List modelGroups = new ArrayList(); int modelIndex = 0; while (modelIndex < numModels) { // get primary model, remember child name FactoredNgramModel primaryModel = models[modelIndex]; String childName = primaryModel.child.name; modelIndex++; List secondaryModelsList = new ArrayList(); // get secondary models with same child name while (modelIndex < numModels && models[modelIndex].child.name == childName) { secondaryModelsList.add(models[modelIndex]); modelIndex++; } FactoredNgramModel[] secondaryModels = new FactoredNgramModel[secondaryModelsList.size()]; secondaryModelsList.toArray(secondaryModels); // make, add model group modelGroups.add(new ModelGroup(primaryModel, secondaryModels)); } // done return modelGroups; } /** Test loading and scoring. 
*/ public static void main(String[] args) throws IOException { String usage = "Usage: java opennlp.ccg.ngrams.FactoredNgramModelFamily "; if (args.length > 0 && args[0].equals("-h")) { System.out.println(usage); System.exit(0); } String specfile = args[0]; String tokens = args[1]; System.out.println("Loading n-gram model family from: " + specfile); FactoredNgramModelFamily lmFamily = new FactoredNgramModelFamily(specfile); System.out.println("primary child var: " + lmFamily.primaryGroup.childName); if (lmFamily.furtherGroups != null) { for (int i = 0; i < lmFamily.furtherGroups.length; i++) { System.out.println("further child var: " + lmFamily.furtherGroups[i].childName); } } System.out.println("order: " + lmFamily.order); System.out.println("openVocab: " + lmFamily.openVocab); System.out.println(); Tokenizer tokenizer = new DefaultTokenizer(); List words = tokenizer.tokenize(tokens, true); System.out.println("scoring: "); for (int i = 0; i < words.size(); i++) { System.out.println(words.get(i).toString()); } System.out.println(); lmFamily.setDebug(true); lmFamily.setWordsToScore(words, true); lmFamily.prepareToScoreWords(); double logprob = lmFamily.logprob(); double score = convertToProb(logprob); System.out.println("score: " + score); System.out.println("logprob: " + logprob); System.out.println("ppl: " + NgramScorer.convertToPPL(logprob / (words.size()-1))); } } ================================================ FILE: src/opennlp/ccg/ngrams/KenNgramModel.java ================================================ package opennlp.ccg.ngrams; import opennlp.ccg.ngrams.kenlm.jni.KenLM; import opennlp.ccg.ngrams.kenlm.MurmurHash; import java.io.*; import java.util.List; import java.util.ArrayList; import java.util.Map; import java.util.HashMap; import opennlp.ccg.lexicon.DefaultTokenizer; import opennlp.ccg.lexicon.Tokenizer; import opennlp.ccg.lexicon.Word; public class KenNgramModel extends AbstractStandardNgramModel { // the nuts-n-bolts JNI class. private KenLM kenlm = null; // Map of hash of word to integer representation (integerized word used by KenLM). private Map hash2ID = new HashMap(); // Map of String (word to score) to hash of word. // private Map word2Hash = new HashMap(); // Map from hashes to tokens (to see whether we have encountered a new token). private Map hash2String = new HashMap(); // List of vocabulary tokens. New items are added and assigned their index as a representation. private List vocabList = new ArrayList(); // Whether to lowercase text before querying to the language model (e.g., "Pierre Vinken" => "pierre vinken"). private boolean lowercaseText = false; // Whether to split up named entities before querying the language model (e.g., "Pierre_Vinken" => "Pierre Vinken") private boolean splitNEs = false; // What character delimter to use to split NEs on. private char neDelim = '_'; // A reusable container for scoring strings. // private List someStringsToScore = null; // Whether to print out messages that trace the scoring process. public boolean debugScore = false; public KenNgramModel(int order, String lmFile, boolean useSemClasses, boolean lowercaseText, boolean splitNEs, char neDelim, boolean useNgramFeatures) throws IOException { super(order, useSemClasses); this.lowercaseText = lowercaseText; this.splitNEs = splitNEs; this.neDelim = neDelim; kenlm = new KenLM(order, lmFile); // someStringsToScore = new ArrayList(order); this.useNgramFeatures = useNgramFeatures; } /** Construct with order and filename. (Delegates to superclass for these flags). 
*/ public KenNgramModel(int order, String lmFile) throws IOException { this(order, lmFile, false); } /** Construct with order and filename and an indication of whether to use semantic classes. (Delegates to superclass for these flags). */ public KenNgramModel(int order, String lmFile, boolean useSemClasses) throws IOException { this(order, lmFile, useSemClasses, false, false, '_', false); } /** * Integerize a word and register it with the LM, if needed. */ public int id(String token) { synchronized (this) { long hash = 0; try { hash = MurmurHash.hash64(token); } catch (UnsupportedEncodingException e) { e.printStackTrace(); } String hash_word = hash2String.get(hash); if (hash_word != null) { return hash2ID.get(hash); } else { int id = vocabList.size(); // let kenlm know about this word's ID. kenlm.registerWord(token, id); vocabList.add(token); hash2String.put(hash, token); hash2ID.put(hash, id); return id; } } } /** * Lowercase each token, if desired, and split each token into a list of tokens * (splitting on NE delim token), if desired. */ protected List splitAndLowercase(List words) { List tmp = new ArrayList(words.size()); if(!(lowercaseText || splitNEs)) { return words; } else { for(Word w : words) { String wdString = w.getForm(); String[] parts = wdString.replace(neDelim,' ').split("\\s+"); // ArrayList subTmp = new ArrayList(parts.length); for(String part : parts) { String newWdForm = (lowercaseText) ? part.toLowerCase() : part; // add null attr/val list, since it is not accessible. tmp.add(Word.createWord(newWdForm, w.getPitchAccent(), null, newWdForm, w.getPOS(), w.getSupertag(), w.getSemClass())); } } return tmp; } } /** * Resets wordsToScore to the given ones, reversing them when the reverse * flag is true, and adding sentence delimiters if not already present, when * the completeness flag is true. Delegates to the superclass */ @Override protected void setWordsToScore(List words, boolean complete) { wordsToScore.clear(); tagsAdded = false; List tmp = splitAndLowercase(words); words = tmp; super.setWordsToScore(words, complete); } /** * Calculates a log probability of a delineated substring of the strings * to score using KenLM. * @param pos The start position (inclusive) within the strings to score. * @param len The length, starting from pos, of the string * that should be used. */ @Override public float logProb(int pos, int len) { try { List range = new ArrayList(keysList.size()); for(Object wts : keysList.subList(pos, pos + len)) range.add((String)wts); int rangeSize = range.size(); if(rangeSize == 0) { throw new IllegalArgumentException("empty range specified for log prob"); } // Get hashes of words. int[] wds = new int[range.size()]; int cursor = 0; for(String s : range) wds[cursor++] = id(s); // call KenLM float result = kenlm.prob(wds); if(debugScore) { String wd = range.get(range.size()-1); String context = ""; for(String contextWord : range.subList(0,range.size()-1)) context += " " + contextWord; context = context.trim(); System.out.println("logp(" + wd + " | " + context + ") = " + result); } return result; } catch(IndexOutOfBoundsException e) { return 0.0f; } } /** Test loading and scoring. */ // NB: This produces the same scores as the SRILM ngram tool when both // and tags are used. 
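// Editor's sketch (not part of the original source): programmatic use mirrors the test in
// main() below; the model path and sentence are placeholders. The public entry point
// inherited from NgramScorer takes a word list directly:
//
//   KenNgramModel lm = new KenNgramModel(3, "models/example.arpa");   // order 3, other flags defaulted
//   List<Word> words = new DefaultTokenizer().tokenize("pierre vinken joined the board");
//   double logprob = lm.logprob(words);               // base-10 log prob via NgramScorer.logprob(List)
//   double prob = NgramScorer.convertToProb(logprob);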
public static void main(String[] args) throws IOException { String usage = "Usage: java opennlp.ccg.ngrams.KenLM "; if (args.length > 0 && args[0].equals("-h")) { System.out.println(usage); System.exit(0); } long start = System.currentTimeMillis(); String order = args[0]; String lmfile = args[1]; String tokens = args[2]; boolean lowercase = true, splitNEs = false; // we want to prove that there are NEs to split and that there are uppercase chars to preserve. for(char c : tokens.toCharArray()) { if (c == '_') { splitNEs = true; if (!lowercase) break; } if (Character.isUpperCase(c)) { lowercase = false; if(splitNEs) break; } } System.out.println("Loading n-gram model with order " + order + " from: " + lmfile); KenNgramModel lm = new KenNgramModel(Integer.parseInt(order), lmfile, false, lowercase, splitNEs, '_', false); lm.debugScore = true; int secs = (int) (System.currentTimeMillis() - start) / 1000; System.out.println("secs: " + secs); System.out.println(); Tokenizer tokenizer = new DefaultTokenizer(); List words = tokenizer.tokenize(tokens); System.out.println("scoring: " + tokens); System.out.println(); lm.setWordsToScore(words, true); lm.prepareToScoreWords(); double logprob = lm.logprob(); double score = convertToProb(logprob); System.out.println(); System.out.println("score: " + score); System.out.println("logprob: " + logprob); // Find out how many words there are here. int size = lm.splitAndLowercase(words).size(); System.out.println("ppl: " + NgramScorer.convertToPPL(logprob / (size-1))); } } ================================================ FILE: src/opennlp/ccg/ngrams/LinearNgramScorerCombo.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-5 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.ngrams; import java.util.*; import opennlp.ccg.perceptron.*; import opennlp.ccg.synsem.Sign; import opennlp.ccg.lexicon.Word; /** * Linear combination of n-gram probability models, * interpolated at the word level; can also be used * as a feature extractor in a perceptron model. * The models must have the same direction. * * @author Michael White * @version $Revision: 1.17 $, $Date: 2009/06/22 04:32:47 $ */ public class LinearNgramScorerCombo extends NgramScorer implements FeatureExtractor { /** The component models. */ protected NgramScorer[] models; /** The weights. */ protected double weights[]; /** * Creates a new linear combo model with the given component models * and with the combination weights determined by the rank order * centroid method. The models are assumed to be ordered from * most to least important. 
*/ public LinearNgramScorerCombo(NgramScorer[] models) { this(models, rankOrderCentroidWeights(models.length)); } /** * Creates a new linear combo model with the given component models * and combination weights. The weights are assumed to sum to 1, * and the number of weights is assumed to match the number of models. * The wordsToScore list is shared across the component models. */ public LinearNgramScorerCombo(NgramScorer[] models, double[] weights) { this.models = models; this.weights = weights; for (int i = 0; i < models.length; i++) { models[i].shareWordsToScore(wordsToScore); order = Math.max(order, models[i].order); } } /** Set reverse flag, and propagate to component models. */ public void setReverse(boolean reverse) { super.setReverse(reverse); for (int i = 0; i < models.length; i++) { models[i].setReverse(reverse); } } /** Sets wordsToScore to the given list, for sharing purposes. */ protected void shareWordsToScore(List wordsToScore) { this.wordsToScore = wordsToScore; for (int i = 0; i < models.length; i++) { models[i].shareWordsToScore(wordsToScore); } } /** Does further preparation before scoring words for each component model. */ protected void prepareToScoreWords() { for (int i = 0; i < models.length; i++) { models[i].prepareToScoreWords(); } } /** Returns the log prob of the ngram starting at the given index in wordsToScore and with the given order, with backoff. In particular, returns the linear combination using the established weights of the probabilities given by the component models, converted back to a log prob (base 10). */ protected float logProbFromNgram(int i, int order) { double prob = 0; for (int j = 0; j < models.length; j++) { prob += convertToProb(models[j].logProbFromNgram(i, order)) * weights[j]; } return (float) convertToLogProb(prob); } /** * Increments ngram counts for the ngrams starting at the given index in * wordsToScore and with the given order. The implementation * delegates to the component models. */ protected void incNgrams(FeatureMap featmap, int i, int order) { for (int j = 0; j < models.length; j++) { if (models[j].useNgramFeatures) models[j].incNgrams(featmap, i, order); } } /** Flag for including the interpolated log prob as a feature. */ protected boolean useInterpLogProb = true; /** Sets the flag for including interpolated log prob as a feature. */ public void setInterpLogProb(boolean useInterpLogProb) { this.useInterpLogProb = useInterpLogProb; } /** * Returns a feature vector with the log prob features * for the given sign and completeness flag. * In particular, returns the log prob from each model as * the value of a feature named '$ngramN'. * The interpolated log prob is also returned as a feature '$ngram' if * the flag for including the interpolated log prob as a feature is set (the default). */ public FeatureVector extractLogProbs(Sign sign, boolean complete) { FeatureList retval = new FeatureList(models.length+1); if (useInterpLogProb) { Alphabet.Feature f = alphabet.index("$ngram"); if (f != null) retval.add(f, (float)logprob(sign, complete)); } for (int i=0; i < models.length; i++) { Alphabet.Feature f = alphabet.index("$ngram"+i); if (f != null) retval.add(f, (float)models[i].logprob(sign, complete)); } return retval; } /** Sets the alphabet. 
*/ public void setAlphabet(Alphabet alphabet) { super.setAlphabet(alphabet); for (NgramScorer scorer : models) { scorer.setAlphabet(alphabet); } } } ================================================ FILE: src/opennlp/ccg/ngrams/NgramDiversityPruningStrategy.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.ngrams; import opennlp.ccg.lexicon.Word; import opennlp.ccg.realize.*; import opennlp.ccg.synsem.Sign; import java.util.*; /** * A diversity pruning strategy that defines signs to be * notCompellinglyDifferent if the n-1 initial and final words * are the same, where n is the n-gram order of interest. * The single arg constructor defaults the singleBestPerGroup flag * to true, which can increase efficiency with no loss in quality * when only the single best output is of interest (as long as the * reduction in the search space outweighs the extra time necessary * to check for the same initial and final words). * * @author Michael White * @version $Revision: 1.3 $, $Date: 2009/12/21 03:27:18 $ */ public class NgramDiversityPruningStrategy extends DiversityPruningStrategy { /** The n-gram order. */ protected int order; /** Constructor that defaults singleBestPerGroup to true. */ public NgramDiversityPruningStrategy(int order) { this(order, true); } /** Full constructor. */ public NgramDiversityPruningStrategy(int order, boolean singleBestPerGroup) { this.order = order; this.singleBestPerGroup = singleBestPerGroup; } /** Returns true iff the given signs are not compellingly different. In particular, returns true iff the n-1 initial and final words are the same. 
*/ public boolean notCompellinglyDifferent(Sign sign1, Sign sign2) { List words1 = sign1.getWords(); List words2 = sign2.getWords(); int words1Len = words1.size(); int words2Len = words2.size(); for (int i = 0; i < order-1 && i < words1Len && i < words2Len; i++) { if (words1.get(i) != words2.get(i)) return false; } int wordsLenDiff = words1Len-words2Len; for (int i = words1Len-1; i > words1Len-order && i >= 0 && i >= wordsLenDiff; i--) { int j = i - wordsLenDiff; if (words1.get(i) != words2.get(j)) return false; } return true; } } ================================================ FILE: src/opennlp/ccg/ngrams/NgramFilter.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.ngrams; import opennlp.ccg.lexicon.Word; import java.util.*; /** * Interface for objects that filter unhappy n-grams. * * @author Michael White * @version $Revision: 1.3 $, $Date: 2005/10/20 18:49:42 $ */ public interface NgramFilter { /** Returns whether to filter out the given list of words. */ public boolean filterOut(List words); } ================================================ FILE: src/opennlp/ccg/ngrams/NgramPrecisionModel.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-5 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.ngrams; import opennlp.ccg.grammar.*; import opennlp.ccg.lexicon.*; import opennlp.ccg.perceptron.FeatureVector; import opennlp.ccg.synsem.Sign; import opennlp.ccg.util.*; import gnu.trove.*; import java.util.*; /** * N-gram precision scoring model, using a linear combination of * n-grams with rank order centroid weights, and optionally replacing word forms with * their semantic classes. 
* Words in the target strings are assumed to contain any desired delimiters. * With the exact matches flag set, only exact matches count. * * @author Michael White * @version $Revision: 1.18 $, $Date: 2011/05/15 20:35:06 $ */ public class NgramPrecisionModel extends NgramScorer implements SelfParaphraseBiaser { // n-grams in the target phrases @SuppressWarnings("unchecked") private Set> targetNgrams = new THashSet(); // weights private double[] weights = null; // exact matches flag private boolean exactMatches = false; /** Reusable list of reduced words. */ protected List reducedWords = new ArrayList(); /** Reusable word list, with identity equals. */ protected List wordList = new ArrayListWithIdentityEquals(); /** * Creates a new 4-gram precision model with no initial target strings * and with the combination weights determined by the rank order centroid method. * Word forms are not replaced by their semantic classes. */ public NgramPrecisionModel() { this(new String[]{}, false); } /** * Creates a new 4-gram precision model from the given target strings * and with the combination weights determined by the rank order centroid method. * Word forms are not replaced by their semantic classes. */ public NgramPrecisionModel(String[] targets) { this(targets, false); } /** * Creates a new n-gram precision model of the given order from the given target strings * and with the combination weights determined by the rank order centroid method. * Word forms are not replaced by their semantic classes. */ public NgramPrecisionModel(String[] targets, int order) { this(targets, order, false); } /** * Creates a new 4-gram precision model from the given target strings, * with the given flag controlling whether word forms are replaced by their semantic classes, * and with the combination weights determined by the rank order centroid method. */ public NgramPrecisionModel(String[] targets, boolean useSemClasses) { this(targets, 4, useSemClasses); } /** * Creates a new n-gram precision model of the given order from the given target strings, * with the given flag controlling whether word forms are replaced by their semantic classes, * and with the combination weights determined by the rank order centroid method. */ public NgramPrecisionModel(String[] targets, int order, boolean useSemClasses) { this(targets, order, useSemClasses, rankOrderCentroidWeights(order)); } /** * Creates a new n-gram precision model of the given order from the given target strings, * with the given flag controlling whether word forms are replaced by their semantic classes, * and with the given combination weights, beginning with the * highest-order weight and ending with the lowest-order (unigram) weight. */ public NgramPrecisionModel(String[] targets, int order, boolean useSemClasses, double[] weights) { this.useSemClasses = useSemClasses; this.order = order; this.weights = new double[order]; for (int i = 0; i < order; i++) { this.weights[order-(i+1)] = weights[i]; } initTargetNgrams(targets); } /** Sets the exact matches flag. */ public void setExactMatches(boolean exactMatches) { this.exactMatches = exactMatches; } /** Returns the exact matches flag. */ public boolean getExactMatches() { return exactMatches; } /** Reduces the words in wordsToScore to reducedWords, before scoring. 
*/ protected void prepareToScoreWords() { reducedWords.clear(); for (int i = 0; i < wordsToScore.size(); i++) { Word w = wordsToScore.get(i); reducedWords.add(reduceWord(w)); } } /** Returns the given word reduced to a surface word, using the sem class, if apropos. */ protected Word reduceWord(Word w) { if (useSemClasses && isReplacementSemClass(w.getSemClass())) return Word.createSurfaceWordUsingSemClass(w); else return Word.createSurfaceWord(w); } /** * Returns a score between 0 (worst) and 1 (best) for the given sign * and completeness flag, based on the n-gram score of the sign's words. * If the sign is complete, sentence delimiters are added before * scoring the words, if not already present. * Returns 0 if any filter flags the n-gram for filtering, or if * the sign has no words. * Otherwise, sets signToScore, calls prepareToScoreWords, * and then calculates and returns the n-gram precision score. * In particular, returns the linear combination using the established weights * of the various n-gram precision scores (from unigram up to the configured order), * where the n-gram precision is the number of n-grams with a match in the target * strings divided by the number of n-grams in the word sequence. * With the exact matches flag set, only exact matches count. * With short sequences (less than the order), the score is adjusted * proportionally to the max score. */ public synchronized double score(Sign sign, boolean complete) { // setup List words = sign.getWords(); if (words == null) return 0; signToScore = sign; setWordsToScore(words, complete); if (ngramFilters != null) { for (int i = 0; i < ngramFilters.size(); i++) { NgramFilter filter = ngramFilters.get(i); if (filter.filterOut(wordsToScore)) return 0; } } prepareToScoreWords(); // calc weighted precision score double retval = 0; for (int i = 0; i < order; i++) { retval += weights[i] * ngramPrecision(i+1); } signToScore = null; // adjust score for short sequences int numWords = wordsToScore.size(); if (numWords < order) { double max = 0.0; for (int i=0; i < numWords; i++) max += weights[i]; retval = retval / max; } // done return retval; } /** * Returns the features as counts of each ngram for the given sign and completeness flag. * This method returns the feature map as a feature vector. */ public FeatureVector extractFeatures(Sign sign, boolean complete) { return extractFeatureMap(sign, complete); } /** Not supported; throws an UnsupportedOperationException. */ protected float logProbFromNgram(int i, int order) { throw new UnsupportedOperationException(); } // returns the n-gram precision of the given order, or zero if too few words private double ngramPrecision(int order) { int numWords = reducedWords.size(); int numNgrams = numWords - (order-1); if (numNgrams <= 0) return 0; int matches = 0; for (int i=0; i < numNgrams; i++) { setNgram(reducedWords, i, order); if (targetNgrams.contains(wordList)) matches++; } if (exactMatches) return (matches == numNgrams) ? 1.0 : 0.0; else return (matches * 1.0) / numNgrams; } /** Sets wordList to be the n-gram of the given order using words starting at pos i. */ protected synchronized void setNgram(List words, int i, int order) { wordList.clear(); for (int j = 0; j < order; j++) { wordList.add(words.get(i+j)); } } /** * Sets the keys in keysList to hold the ngram starting at the given index in * wordsToScore and with the given order; returns true if the operation * succeeds normally. The implementation uses reducedWords. 
*/ protected boolean setKeysToNgram(int i, int order) { keysList.clear(); for (int j = 0; j < order; j++) { keysList.add(reducedWords.get(i+j).getForm()); } return true; } /** Makes a canonical n-gram of the given order using words starting at pos i. Sublists are shared, a la a trie data structure. */ @SuppressWarnings("unchecked") protected List makeNgram(List words, int i, int order) { // check for one already interned setNgram(words, i, order); List alreadyInterned = (List) Interner.getGlobalInterned(wordList); if (alreadyInterned != null) return alreadyInterned; // if order is 1, intern new singleton list if (order == 1) { return (List) Interner.globalIntern(new SingletonList(words.get(i))); } // otherwise, extend list for the first word with suffix list List firstOneList = makeNgram(words, i, 1); List suffixList = makeNgram(words, i+1, order-1); return (List) Interner.globalIntern(new StructureSharingList(firstOneList, suffixList)); } // initializes the n-grams from the target phrases private void initTargetNgrams(String[] targets) { for (int j = 0; j < targets.length; j++) { if (targets[j].length() == 0) continue; // parse or tokenize target phrase into words List words; if (useSemClasses) // use parsed words to get sem classes words = Grammar.theGrammar.getParsedWords(targets[j]); else words = Grammar.theGrammar.lexicon.tokenizer.tokenize(targets[j]); // add sentence delimiters, if not already present setWordsToScore(words, true); // reduce each word to a surface word, using the sem class if apropos int numWords = wordsToScore.size(); for (int i = 0; i < numWords; i++) { Word w = wordsToScore.get(i); wordsToScore.set(i, reduceWord(w)); } // make and store target n-grams for (int k=0; k < order; k++) { for (int i=0; i < numWords - k; i++) { targetNgrams.add(makeNgram(wordsToScore, i, k+1)); } } } } /** Sets the target strings for implementing the self-paraphrase bias. */ @SuppressWarnings("unchecked") public void setTargets(String[] targets) { targetNgrams = new THashSet(); initTargetNgrams(targets); } } ================================================ FILE: src/opennlp/ccg/ngrams/NgramScorer.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-8 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.ngrams; import opennlp.ccg.synsem.Sign; import opennlp.ccg.synsem.SignScorer; import opennlp.ccg.grammar.Grammar; import opennlp.ccg.lexicon.*; import opennlp.ccg.util.*; import opennlp.ccg.perceptron.*; import java.util.*; import java.io.*; /** * Super class for n-gram scoring models. 
* * @author Michael White * @version $Revision: 1.37 $, $Date: 2010/02/25 22:26:11 $ */ public abstract class NgramScorer implements SignScorer, Reversible, FeatureExtractor { protected NgramScorer() {} protected NgramScorer(int order) { this(order, false); } protected NgramScorer(int order, boolean useSemClasses) { this.order = order; this.useSemClasses = useSemClasses; } /** The n-gram order of the model. */ protected int order; /** Returns the n-gram order of the model. */ public int getOrder() { return order; } /** Flag for whether to reverse words before scoring (defaults to false). */ protected boolean reverse = false; /** Get reverse flag. */ public boolean getReverse() { return reverse; } /** Set reverse flag, and propagate to any reversible filters. */ public void setReverse(boolean reverse) { this.reverse = reverse; if (ngramFilters != null) { for (int i = 0; i < ngramFilters.size(); i++) { NgramFilter filter = ngramFilters.get(i); if (filter instanceof Reversible) ((Reversible)filter).setReverse(reverse); } } } /** Root of the n-gram trie. Nodes store NgramFloats instances. */ protected TrieMap trieMapRoot = new TrieMap(null); /** An ngram data object, for holding the log prob and backoff weight. */ public static class NgramFloats { /** The log prob. */ public float logprob; /** The backoff weight. */ public float bow; /** Constructor. */ public NgramFloats(float logprob, float bow) { this.logprob = logprob; this.bow = bow; } @Override public String toString() { return "logprob: " + logprob + ", bow: " + bow; } } /** The n-gram totals for different histories. */ protected int[] numNgrams = null; /** Flag for open vocabulary, ie whether the unknown word <unk> is in the model. */ protected boolean openVocab = false; /** Flag for whether to show scoring breakdown. */ protected boolean debugScore = false; /** Sets the debug score flag. */ public void setDebug(boolean debugScore) { this.debugScore = debugScore; } /** List of n-gram filters, for identifying unhappy sequences. */ protected List ngramFilters = null; /** Adds an n-gram filter. */ public void addFilter(NgramFilter filter) { if (ngramFilters == null) { ngramFilters = new ArrayList(); } ngramFilters.add(filter); } /** The alphabet, for filtering features to the relevant ones (when present). */ protected Alphabet alphabet = null; /** Sets the alphabet, so that features can be filtered to the relevant ones (when present). */ public void setAlphabet(Alphabet alphabet) { this.alphabet = alphabet; } /** Weak hash map for cached log probs, keyed from a sign's words. */ protected Map,Float> cachedLogProbs = null; /** Reference to current sign to score. */ protected Sign signToScore = null; /** Reusable list of words to score. */ protected List wordsToScore = new ArrayList(); /** Flag for whether start/end tags were added with the current words. */ protected boolean tagsAdded = false; /** Reusable list of keys for n-gram lookups. */ protected List keysList = new ArrayList(); /** Reusable list of keys for n-gram feature lookups. */ protected List featureKeysList = new ArrayList(); /** Gets a cached log prob for the given list of words (or null if none). */ protected Float getCachedLogProb(List words) { if (cachedLogProbs == null) return null; return cachedLogProbs.get(words); } /** Caches a log prob for the given list of words. 
*/ protected void putCachedLogProb(List words, Float logprob) { if (cachedLogProbs == null) cachedLogProbs = new WeakHashMap,Float>(); cachedLogProbs.put(words, logprob); } /** * Returns a score between 0 (worst) and 1 (best) for the given sign * and completeness flag, based on the n-gram score of the sign's words. * If the sign is complete, sentence delimiters are added before * scoring the words, if not already present. * Returns 0 if any filter flags the n-gram for filtering, or if * the sign has no words. * Otherwise, sets signToScore, calls prepareToScoreWords, * and then returns the result of logprob() converted to a probability. */ public synchronized double score(Sign sign, boolean complete) { return convertToProb(logprob(sign, complete)); } /** * Returns a log prob for the given sign and completeness flag, * based on the n-gram log prob of the sign's words. * If the sign is complete, sentence delimiters are added before * scoring the words, if not already present. * Returns the log prob for zero probability if any filter flags the n-gram for filtering, or if * the sign has no words. * Otherwise, sets signToScore, calls prepareToScoreWords, * and then returns the result of logProb(). */ public synchronized double logprob(Sign sign, boolean complete) { List words = sign.getWords(); if (words == null) return 0; if (!complete) { // check cache Float logprob = getCachedLogProb(words); if (logprob != null) return logprob; } signToScore = sign; setWordsToScore(words, complete); if (ngramFilters != null) { for (int i = 0; i < ngramFilters.size(); i++) { NgramFilter filter = ngramFilters.get(i); if (filter.filterOut(wordsToScore)) return convertToLogProb(0); } } prepareToScoreWords(); double retval = logprob(); signToScore = null; return retval; } /** * Returns an n-gram probability from the given list of words, * by converting the result of the logprob method. */ public synchronized double score(List words) { return convertToProb(logprob(words)); } /** * Returns an n-gram log prob for the given list of words. * This method is a simplified version of scoring a sign's words * that does not cache results, filter n-grams or ever add * sentence delimiters. */ public synchronized double logprob(List words) { setWordsToScore(words, false); prepareToScoreWords(); return logprob(); } /** Sets wordsToScore to the given list, for sharing purposes. */ protected void shareWordsToScore(List wordsToScore) { this.wordsToScore = wordsToScore; } /** * Resets wordsToScore to the given ones, reversing them when the reverse * flag is true, and adding sentence delimiters if not already present, when * the completeness flag is true. Also sets the tagsAdded flag. */ protected void setWordsToScore(List words, boolean complete) { wordsToScore.clear(); tagsAdded = false; if (complete && (reverse || words.get(0).getForm() != "")) { wordsToScore.add(Word.createWord("")); tagsAdded = true; } if (reverse) { for (int j = words.size()-1; j >= 0; j--) { Word w = words.get(j); if (w.getForm() == "" || w.getForm() == "") continue; // skip or wordsToScore.add(w); } } else wordsToScore.addAll(words); if (complete && (reverse || words.get(words.size()-1).getForm() != "")) { wordsToScore.add(Word.createWord("")); tagsAdded = true; } } /** Optional step to do further preparation before scoring words. */ protected void prepareToScoreWords() {} /** Returns a feature map with counts of each ngram for the given sign and completness flag. 
*/ public FeatureMap extractFeatureMap(Sign sign, boolean complete) { FeatureMap featmap = new FeatureMap(); // do setup as with scoring List words = sign.getWords(); if (words == null) return featmap; signToScore = sign; setWordsToScore(words, complete); prepareToScoreWords(); // count ngrams int numWords = wordsToScore.size(); for (int k=1; k <= order; k++) { int numNgrams = numWords - (k-1); if (numNgrams <= 0) continue; for (int i = 0; i < numNgrams; i++) { incNgrams(featmap, i, k); } } // return signToScore = null; return featmap; } /** * Returns a feature vector with the log prob features * for the given sign and completeness flag. * The default implementation returns the log prob as * the value of a feature named '$ngram' plus the counts of each ngram. */ public FeatureVector extractLogProbs(Sign sign, boolean complete) { FeatureList retval = new FeatureList(1); Alphabet.Feature f = alphabet.index("$ngram"); if (f != null) retval.add(f, (float)logprob(sign, complete)); return retval; } /** * Returns the features for the given sign and completeness flag. * The default implementation returns the log prob as * the value of a feature named '$ngram' plus the counts of each ngram. */ public FeatureVector extractFeatures(Sign sign, boolean complete) { FeatureVector logprob = extractLogProbs(sign, complete); if (useNgramFeatures) { FeatureMap map = extractFeatureMap(sign, complete); return new ComposedFeatureVector(logprob, map); } else return logprob; } /** * Increments ngram counts for the ngrams starting at the given index in * wordsToScore and with the given order. The default implementation * uses ngram(i, order). */ protected void incNgrams(FeatureMap featmap, int i, int order) { List ngram = ngram(i, order); if (ngram == null) return; Alphabet.Feature f = alphabet.index(ngram); if (f != null) featmap.inc(f); } /** * Returns a list of feature keys for the ngram starting at the given index in * wordsToScore and with the given order, using the keys in keysList after * setting them appropriately with setKeysToNgram; returns null if this * operation does not succeed normally. */ protected List ngram(int i, int order) { boolean ok = setKeysToNgram(i, order); if (!ok) return null; featureKeysList.clear(); for (int j=0; j < keysList.size(); j++) { Object key = keysList.get(j); if (!(key instanceof String)) { throw new RuntimeException("Feature keys must be strings!"); } else featureKeysList.add((String)key); } return featureKeysList; } /** * Returns a log prob for the words in wordsToScore. * The default method returns the log prob of the word sequence * as determined by this language model's logProbFromNgram method. * The probabilities for the first n-1 words are backed off to the * lower order probabilities. * If the tagsAdded flag is false, the cache is checked to see whether * the log prob of the words of signToScore's initial sign has already * been calculated, and at the end the log prob of signToScore's words * is stored in the cache. */ protected double logprob() { float logProbTotal = 0; int numCached = 0; if (!tagsAdded && signToScore != null) { // check cache for initial words Sign[] inputs = signToScore.getDerivationHistory().getInputs(); if (inputs != null) { Sign initialSign = (!reverse) ? 
inputs[0] : inputs[inputs.length-1]; List initialWords = initialSign.getWords(); Float logprob = getCachedLogProb(initialWords); if (logprob != null) { logProbTotal = logprob.floatValue(); numCached = initialWords.size(); } } } for (int i = numCached; i < wordsToScore.size(); i++) { int orderToUse = Math.min(order, i+1); int startPos = i - (orderToUse-1); logProbTotal += logProbFromNgram(startPos, orderToUse); } if (!tagsAdded && signToScore != null) { // add log prob to cache putCachedLogProb(signToScore.getWords(), new Float(logProbTotal)); } return logProbTotal; } /** * Returns the log prob of the ngram starting at the given index in * wordsToScore and with the given order, with backoff. */ abstract protected float logProbFromNgram(int i, int order); /** * Sets the keys in keysList to hold the ngram starting at the given index in * wordsToScore and with the given order; returns true if the operation * succeeds normally. The default implementation invokes * logProbFromNgram, and returns false if the log prob is zero. */ protected boolean setKeysToNgram(int i, int order) { float logprob = logProbFromNgram(i, order); return logprob != 0; } /** Flag for using ngrams as features. */ protected boolean useNgramFeatures = true; /** Sets the the flag for using ngrams as features. */ public void setNgramFeatures(boolean useNgramFeatures) { this.useNgramFeatures = useNgramFeatures; } /** * Flag whether to use sem classes in place of words. * Defaults to false. */ protected boolean useSemClasses = false; // tokenizer reference private Tokenizer tokenizer = null; private Tokenizer getTokenizer() { if (tokenizer != null) return tokenizer; if (Grammar.theGrammar != null) tokenizer = Grammar.theGrammar.lexicon.tokenizer; else tokenizer = new DefaultTokenizer(); return tokenizer; } /** Returns whether the given semantic class is a replacement one. */ protected boolean isReplacementSemClass(String semClass) { return semClass != null && getTokenizer().isReplacementSemClass(semClass); } /** * Returns the semantic class replacement value (the semantic class * uppercased and interned) for the given word, if apropos, otherwise null. */ protected String semClassReplacement(Word w) { if (useSemClasses) { String semClass = w.getSemClass(); if (isReplacementSemClass(semClass)) return semClass.toUpperCase().intern(); } // otherwise null return null; } /** * Adds the TrieMap children, with their keys, under the given prefix, then * resets the lists. */ protected void addTrieMapChildren(List prefix, List keys, List> children) { if (!keys.isEmpty()) { TrieMap prefixNode = trieMapRoot.findChildFromList(prefix); prefixNode.addChildren(keys, children); } prefix.clear(); keys.clear(); children.clear(); } /** Returns the TrieMap node for the given sublist of keysList. */ protected TrieMap getNode(int pos, int len) { return trieMapRoot.getChildFromList(keysList.subList(pos, pos+len)); } // from CMU-Cambridge Statistical Language Modeling Toolkit // // p(wd3|wd1,wd2)= if(trigram exists) p_3(wd1,wd2,wd3) // else if(bigram w1,w2 exists) bo_wt_2(w1,w2)*p(wd3|wd2) // else p(wd3|w2) // // p(wd2|wd1)= if(bigram exists) p_2(wd1,wd2) // else bo_wt_1(wd1)*p_1(wd2) /** * Returns the log prob (base 10) of the given sublist of keysList, with * backoff, or -99 if not found. 
*/ protected float logProb(int pos, int len) { TrieMap node = getNode(pos, len); if (node != null && node.data != null) return node.data.logprob; if (len == 1) return -99; float retval = logProb(pos+1, len-1); if (debugScore) System.out.print("(" + (len-1) + "-gram: " + retval + ") "); if (retval > -99) retval += backoffWeight(pos, len-1); return retval; } /** * Returns the back-off weight (log base 10) of the given sublist of * keysList, or 0 if not found. */ protected float backoffWeight(int pos, int len) { TrieMap node = getNode(pos, len); if (node != null && node.data != null) { float retval = node.data.bow; // if (debugScore && retval != 0) System.out.print("(bow: " + retval + ") "); return retval; } return 0; } /** * Returns the rank order centroid weights for a ranked list of the given length. * The weights go from highest to lowest, and sum to 1. */ // ex: // weight 1 0.5208333333333333 // weight 2 0.2708333333333333 // weight 3 0.14583333333333331 // weight 4 0.0625 public static double[] rankOrderCentroidWeights(int length) { double[] retval = new double[length]; for (int i = 0; i < length; i++) { double weight_i = 0; for (int j = i; j < length; j++) { weight_i += 1 / (double) (j+1); } weight_i = weight_i / (double) length; retval[i] = weight_i; } return retval; } /** Converts a base 10 log prob to an actual probability, checking for -99 (not found). */ public static double convertToProb(double logProb) { if (logProb <= -99) { return 0; } else return Math.pow(10, logProb); } /** Converts a probability to a base 10 log prob, returning -99 if zero. */ public static double convertToLogProb(double prob) { if (prob == 0) return -99; else return Math.log(prob) / Math.log(10); } /** Converts a base 10 log prob to the corresponding perplexity. */ public static double convertToPPL(double logProb) { return Math.exp(- logProb * Math.log(10)); } /** Sets up tokenizer for reading in language models. */ protected static StreamTokenizer initTokenizer(Reader in) { StreamTokenizer tokenizer = new StreamTokenizer(in); tokenizer.resetSyntax(); tokenizer.wordChars(0,255); tokenizer.whitespaceChars(' ',' '); tokenizer.whitespaceChars('\t','\t'); tokenizer.whitespaceChars('\n','\n'); tokenizer.whitespaceChars('\r','\r'); tokenizer.eolIsSignificant(true); return tokenizer; } /** * Reads a line of up to tokens.length tokens using the given tokenizer, * with the remaining array elements set to null. */ protected static void readLine(StreamTokenizer tokenizer, String[] tokens) throws IOException { int index = 0; int ttype; while ( (ttype = tokenizer.nextToken()) != StreamTokenizer.TT_EOF && ttype != StreamTokenizer.TT_EOL ) { if (index < tokens.length && ttype == StreamTokenizer.TT_WORD) { tokens[index] = tokenizer.sval; index++; } } for (int i = index; i < tokens.length; i++) { tokens[i] = null; } } } ================================================ FILE: src/opennlp/ccg/ngrams/RepetitionScorer.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. 
// // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.ngrams; import opennlp.ccg.synsem.Sign; import opennlp.ccg.synsem.SignScorer; import opennlp.ccg.lexicon.Word; import java.util.*; import gnu.trove.*; /** * Scores a sign according to how repetitive its words are given the * observed context. Relevant repeated items (eg stems) are counted, * with full counts given to items in the previous words or recent context, * and fractional counts to older items. The score is then assigned according * to the number of repeated items and the configured penalty, as * 10 to the minus (penalty times repeated items). * * @author Michael White * @version $Revision: 1.6 $, $Date: 2011/03/20 20:11:58 $ */ @SuppressWarnings({"unchecked","rawtypes"}) public class RepetitionScorer implements SignScorer { /** The repetition penalty (defaults to 1.0). */ public double penalty = 1.0; /** The fractional count for the older items (defaults to 0.5). */ public double olderCount = 0.5; /** The fractional count for the even older items (defaults to 0.25). */ public double evenOlderCount = 0.25; /** The fractional count for the oldest items (defaults to 0.125). */ public double oldestCount = 0.125; /** The interned POS values to use for repetition scoring purposes. */ protected Set posValsToUse = new THashSet(new TObjectIdentityHashingStrategy()); /** The interned stems to ignore for repetition scoring purposes. */ protected Set stemsToIgnore = new THashSet(new TObjectIdentityHashingStrategy()); /** The interned items (eg stems) seen in the previous words. */ protected Set previousItems = new THashSet(new TObjectIdentityHashingStrategy()); /** The interned items (eg stems) seen in the recent context. */ protected Set contextItems = new THashSet(new TObjectIdentityHashingStrategy()); /** The interned items (eg stems) seen in the older context. */ protected Set olderContextItems = new THashSet(new TObjectIdentityHashingStrategy()); /** The interned items (eg stems) seen in the even older context. */ protected Set evenOlderContextItems = new THashSet(new TObjectIdentityHashingStrategy()); /** The interned items (eg stems) seen in the oldest context. */ protected Set oldestContextItems = new THashSet(new TObjectIdentityHashingStrategy()); /** * Default constructor. * Adds "NNP", "N", "V", "Adj" and "Adv" to posValsToUse, * and "do" and "not" to stemsToIgnore. */ public RepetitionScorer() { String[] posVals = { "NNP", "N", "V", "Adj", "Adv" }; posValsToUse.addAll(Arrays.asList(posVals)); String[] stems = { "do", "not" }; stemsToIgnore.addAll(Arrays.asList(stems)); } /** Resets all the context items. */ public void resetContext() { contextItems.clear(); olderContextItems.clear(); evenOlderContextItems.clear(); oldestContextItems.clear(); } /** Ages the context items, clearing the recent ones. 
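* Specifically, items cascade one step older per call: contextItems move to
* olderContextItems, older items to evenOlderContextItems, and even older
* items to oldestContextItems (whose previous contents are dropped), so a
* repeated stem's count decays from 1.0 through olderCount, evenOlderCount
* and finally oldestCount as the discourse moves on.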
*/ public void ageContext() { oldestContextItems.clear(); oldestContextItems.addAll(evenOlderContextItems); evenOlderContextItems.clear(); evenOlderContextItems.addAll(olderContextItems); olderContextItems.clear(); olderContextItems.addAll(contextItems); contextItems.clear(); } /** Adds the items (eg stems) from the given sign's words to the context items. */ public void updateContext(Sign sign) { List words = sign.getWords(); if (words == null) return; for (int i = 0; i < words.size(); i++) { Word word = (Word) words.get(i); updateItems(word, contextItems); } } /** * Adds the items (eg stems) from the given word to the given set. * By default, adds the relevant stems, per the relevantStem method. */ protected void updateItems(Word word, Set set) { String stem = relevantStem(word); if (stem != null) set.add(stem); } /** * Returns the stem of the given word if its POS is in posValsToUse, * unless the stem is in stemsToIgnore; otherwise returns null. */ protected String relevantStem(Word word) { if (!(posValsToUse.contains(word.getPOS()))) return null; String stem = word.getStem(); if (!(stemsToIgnore.contains(stem))) return stem; return null; } /** * Returns a score between 0 (worst) and 1 (best) for the given sign * and completeness flag, according to how repetitive its word are compared to * the observed context. * In particular, returns 10 to the minus (penalty times repeated items), * or zero if there are no words. */ public double score(Sign sign, boolean complete) { List words = sign.getWords(); if (words == null) return 0; return Math.pow(10, -1 * penalty * repeatedItems(words)); } /** * Returns the number of repeated items (eg stems) in the given word list, * using fractional counts for repetitions of older items. * The previous items set is cleared, and then the repeated items * are summed for each word, updating the previous items along the way. */ protected double repeatedItems(List words) { previousItems.clear(); double retval = 0; for (int i = 0; i < words.size(); i++) { Word word = (Word) words.get(i); retval += repeatedItems(word); updateItems(word, previousItems); } return retval; } /** * Returns the number of repeated items (eg stems) in the given word, * using fractional counts for repetitions of older items. * By default, returns 1 (or a fractional count) if the stem is relevant, * per the relevantStem method. */ protected double repeatedItems(Word word) { String stem = relevantStem(word); if (stem == null) return 0; if (contextItems.contains(stem) || previousItems.contains(stem)) return 1; if (olderContextItems.contains(stem)) return olderCount; if (evenOlderContextItems.contains(stem)) return evenOlderCount; if (oldestContextItems.contains(stem)) return oldestCount; return 0; } } ================================================ FILE: src/opennlp/ccg/ngrams/Reversible.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. 
// // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.ngrams; /** * Interface for reversible n-gram classes. * * @author Michael White * @version $Revision: 1.1 $, $Date: 2005/05/26 22:18:05 $ */ public interface Reversible { /** Get reverse flag. */ public boolean getReverse(); /** Set reverse flag. */ public void setReverse(boolean reverse); } ================================================ FILE: src/opennlp/ccg/ngrams/SRILMNgramModel.java ================================================ /* * $Id: SRILMNgramModel.java,v 1.5 2008/11/09 03:29:36 mwhite14850 Exp $ */ package opennlp.ccg.ngrams; import java.io.File; import java.io.IOException; import java.util.List; import java.util.ListIterator; import opennlp.ccg.lexicon.DefaultTokenizer; import opennlp.ccg.lexicon.Tokenizer; import opennlp.ccg.lexicon.Word; /** * A language model that uses the * SRI language modeling * toolkit. * @author Scott Martin * @see SRILM * @version $Revision: 1.5 $ * @since 0.9.2 */ public class SRILMNgramModel extends AbstractStandardNgramModel { /** * Load the binary, platform-dependent library containing the SRILM JNI * bridge code. See ${OPENCCG_HOME}/src/srilmbridge. * @throws UnsatisfiedLinkError If Java can't find the srilmbridge library. */ static { System.loadLibrary("srilmbridge"); } /** * Creates a SRILM language model with the specified ngram order and model * type. * @param order The ngram order to use. * @param lmFile The file to read the langauge model from. * @param useSemClasses Whether or not to use semantic classes. * @param modelType The type of language model. * @throws IOException If a problem occurs reading the language model file. * These include non-existent or unreadable files, file format problems, * etc. */ public SRILMNgramModel(int order, File lmFile, boolean useSemClasses, SRILMNgramModelType modelType) throws IOException { super(order, useSemClasses); loadLMFromFile(order, lmFile, modelType); } /** * Creates a new SRILM language model. * @see SRILMNgramModel#SRILMNgramModel(int, File, boolean, * SRILMNgramModelType) */ public SRILMNgramModel(int order, File lmFile, SRILMNgramModelType modelType) throws IOException { this(order, lmFile, false, modelType); } /** * Loads an LM from a file. * @param ngramOrder The ngram order to use. * @param lmFile The file containing the language model. * @param lmType The type of langauge model to expect. * @throws IOException If the language model file is non-existent or * null, or if a problem occurs loading or parsing the file. */ protected void loadLMFromFile(int ngramOrder, File lmFile, SRILMNgramModelType lmType) throws IOException { if(lmFile == null) { throw new IOException("null file"); } if(!lmFile.exists()) { throw new IOException("file does not exist: " + lmFile); } if(lmFile.isDirectory()) { throw new IOException("file is a directory: " + lmFile); } if(!lmFile.canRead()) { throw new IOException("unable to read file: " + lmFile); } loadLM(ngramOrder, lmFile.getAbsolutePath(), lmType.ordinal()); } /** * Calculates a log probability of a delineated substring of the strings * to score using SRILM. This method reverses the context before passing * the string to SRILM, as this is the format SRILM expects. * @param pos The start position (inclusive) within the strings to score. 
* @param len The length, starting from pos, of the string * that should be used. */ @Override public float logProb(int pos, int len) { try { // create new because reversing list affects keysList List range = keysList.subList(pos, pos + len); int rangeSize = range.size(); if(rangeSize == 0) { throw new IllegalArgumentException( "empty range specified for log prob"); } // only allocate context array if we have to String[] context = (rangeSize > 1) ? new String[rangeSize - 1] : null; if(context != null) { // reverse for SRILM ListIterator contextIterator = range.listIterator(rangeSize - 1); int i = 0; while(contextIterator.hasPrevious()) { context[i++] = contextIterator.previous().toString(); } } // call SRILM to get word in reversed context return doLogProb(range.get(rangeSize - 1).toString(), context); } catch(IndexOutOfBoundsException e) { return 0.0f; } } /** * Invokes SRILM to load a language model. * @param ngramOrder The order of the language model * @param fileAbsolutePath The absolute path of the file containing the * language model. * @param lmType The language model type. * @throws IOException If a problem happens with SRILM while trying to * load the language model. */ private native void loadLM(int ngramOrder, String fileAbsolutePath, int lmType) throws IOException; /** * Invokes SRILM to calculate the log probability of a string in the * given context. SRILM will make its calculations based on the language * model loaded in {@link #loadLM(int, String, int)}. * @param word The word to calculate a probability for. * @param context The context, in reverse order. For example, to calculate * the probability of the word "rain" in the context of the * string "in the rain", the context should be the array * {the, in}. If the context is null or * zero-length, SRILM will assume this means no context should be used. * @return The log probability of the given word in the given (reversed) * context, as determined by SRILM. */ private native float doLogProb(String word, String[] context); /** * Invokes SRILM to clean up any initialized objects. */ @Override protected native void finalize() throws Throwable; public static void main(String[] args) throws Exception { String usage = "Usage: java opennlp.ccg.ngrams.SRILMNgramModel" + " (-reverse)"; if (args.length > 0 && args[0].equals("-h")) { System.out.println(usage); return; } long start = System.currentTimeMillis(); String order = args[0]; String lmfile = args[1]; String lmType = args[2]; String tokens = args[3]; String reversed = (args.length >= 5 && args[4].equals("-reverse")) ? 
"reversed " : ""; System.out.println("Loading " + reversed + "n-gram model with order " + order + " from: " + lmfile); SRILMNgramModel lm = new SRILMNgramModel(Integer.parseInt(order), new File(lmfile), SRILMNgramModelType.valueOf(lmType)); if (reversed.length() > 0) lm.setReverse(true); System.out.println("openVocab: " + lm.openVocab); int secs = (int) (System.currentTimeMillis() - start) / 1000; System.out.println("secs: " + secs); System.out.println(); // System.out.println("trie map: "); // System.out.println(lm.trieMapRoot.toString()); // System.out.println(); Tokenizer tokenizer = new DefaultTokenizer(); List words = tokenizer.tokenize(tokens); System.out.println("scoring: " + tokens); System.out.println(); lm.debugScore = true; lm.setWordsToScore(words, true); lm.prepareToScoreWords(); double logprob = lm.logprob(); double score = convertToProb(logprob); System.out.println(); System.out.println("score: " + score); System.out.println("logprob: " + logprob); System.out.println("ppl: " + NgramScorer.convertToPPL(logprob / (words.size()-1))); } } ================================================ FILE: src/opennlp/ccg/ngrams/SRILMNgramModelType.java ================================================ /* * $Id: SRILMNgramModelType.java,v 1.2 2007/05/30 22:53:17 coffeeblack Exp $ */ package opennlp.ccg.ngrams; /** * Used by {@link SRILMNgramModel} to specify the type of language model that * should be used. * @author Scott Martin * @see SRILM * @version $LastChangedRevision$ */ public enum SRILMNgramModelType { /*!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!* * It is very important that the order of these does not * * change, as {@link SRILMNgramModel#loadLM(int, String, int)}* * relies on the ordinal. * *!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!*/ /** * A "standard" ngram model, of the type normally created by * the SRILM binary ngram-count. */ STANDARD, /** * For ngram models based on count LMs. The Google LM format is one of * these. * @see Web 1T 5-gram Version 1 */ COUNT; } ================================================ FILE: src/opennlp/ccg/ngrams/SRILM_FactoredScorerMaker.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.ngrams; import opennlp.ccg.synsem.SignScorer; import java.io.*; /** * A custom scorer maker that builds and loads factored n-gram models using the * SRILM toolkit, which must be separately installed. * Most parameters are set in the FLM spec file. 
* * @author Michael White * @version $Revision: 1.6 $, $Date: 2007/12/21 05:13:37 $ */ public class SRILM_FactoredScorerMaker extends SRILM_ScorerMaker { /** The base of the model FLM spec file name. Defaults to "test.flm". */ public String flmSpecFileBase = "test.flm"; /** Returns the model FLM spec filename, extending flmSpecFileBase with the discount options string and n-gram order, eg "test.flm.n4". */ protected String flmSpecFilename() { return flmSpecFileBase + "." + discountOptionsStr + getOrder(); } /** Returns the root of the perplexities filename. */ protected String pplFileRoot() { return flmSpecFilename(); } /** Creates fold-specific FLM spec filenames from fold numbers, eg "test.flm.n4.fold1". */ protected String filename(int foldNum) { return flmSpecFilename() + "." + "fold" + foldNum; } /** Writes a fold-specific FLM spec file, given the tmp dir and fold num. The fold-specific file is created by simply replacing ".count" with ".foldN.count" and ".lm" with ".foldN.lm", where N is the fold num, in the model FLM spec file. */ protected void writeFoldSpecFile(File tmpDir, int foldNum) throws IOException { BufferedReader br = new BufferedReader(new FileReader(flmSpecFilename())); File foldSpecFile = new File(tmpDir, filename(foldNum)); PrintWriter out = new PrintWriter(new FileWriter(foldSpecFile)); String dotFoldN = ".fold" + foldNum; String line = null; while ((line = br.readLine()) != null) { int countIndex = line.indexOf(".count"); if (countIndex > 0) { String foldLine = line.substring(0, countIndex); foldLine += dotFoldN; int lmIndex = line.indexOf(".lm", countIndex); foldLine += line.substring(countIndex, lmIndex); foldLine += dotFoldN; foldLine += line.substring(lmIndex); out.println(foldLine); } else { out.println(line); } } out.close(); br.close(); } /** * Prepares a scoring model from the training data, * by exec-ing the SRILM fngram-count tool with the FLM spec file, * and computes perplexity on the test data. * The training/test data are written to foldN-train.txt and foldN-test.txt, * if not already present. * The fold-specific FLM spec file's name is determined by filename(N). */ public void prepScorer(File tmpDir, int foldNum, File trainFile, File testFile) throws IOException { // write fold spec file writeFoldSpecFile(tmpDir, foldNum); // do rest much like standard n-gram scorers super.prepScorer(tmpDir, foldNum, trainFile, testFile); } /** Writes training/test targets. */ protected void writeTargets(File tbFile, String textfile) throws IOException { if (!useSemClasses) cvr.tester.writeTargetsF(tbFile, textfile); else cvr.tester.writeTargetsFSC(tbFile, textfile); } /** Returns the command for making an ngram model. */ protected String countNgrams(int foldNum) { String cmd = "fngram-count -nonull -write-counts -lm " + ((unk) ? "-unk " : "") + "-factor-file " + filename(foldNum) + " " + "-text " + trainingfile(foldNum) + " " + "-debug " + debugLevel; return cmd; } /** Returns the command for calculating perplexity. NB: At present, only the perplexity from the first model is collected. */ protected String scoreNgrams(int foldNum) { String lmfile = filename(foldNum); String cmd2 = "fngram -nonull " + ((unk) ? "-unk " : "") + "-factor-file " + lmfile + " " + "-ppl " + testfile(foldNum); return cmd2; } /** * Loads a scoring model created from the training data. 
*/ public SignScorer loadScorer(File tmpDir, int foldNum, File trainFile) throws IOException { File foldSpecFile = new File(tmpDir, filename(foldNum)); String foldSpecPath = foldSpecFile.getCanonicalPath(); return new FactoredNgramModelFamily(foldSpecPath, useSemClasses); } } ================================================ FILE: src/opennlp/ccg/ngrams/SRILM_ScorerMaker.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.ngrams; import opennlp.ccg.synsem.SignScorer; import opennlp.ccg.test.*; import java.io.*; import java.util.*; /** * A custom scorer maker that builds and loads standard n-gram models using the * SRILM toolkit, which must be separately installed. * This class may be subclassed to set different parameters in the constructor, * for use in cross-validation tests with the realizer. * * @author Michael White * @version $Revision: 1.10 $, $Date: 2007/12/21 05:13:37 $ */ public class SRILM_ScorerMaker implements ScorerMaker { /** Flag specifying whether to use semantic class replacement. */ public boolean useSemClasses = true; /** Flag specifying whether to keep <unk> in the LM. */ public boolean unk = true; /** String specifying the min counts to use in building the n-gram model. */ public String minCountOptions = "-gt1min 1 -gt2min 1 -gt3min 1 -gt4min 1 -gt5min 1 -gt6min 1"; /** String specifying the discounting parameters. */ public String discountOptions = N_DISCOUNT_PARAMS; /** String specifying natural discounting parameters. */ public static final String N_DISCOUNT_PARAMS = "-ndiscount1 -ndiscount2 -ndiscount3 -ndiscount4 -ndiscount5 -ndiscount6"; /** String specifying Witten-Bell discounting parameters. */ public static final String WB_DISCOUNT_PARAMS = "-wbdiscount1 -wbdiscount2 -wbdiscount3 -wbdiscount4 -wbdiscount5 -wbdiscount6"; /** String specifying modified Kneser-Ney natural discounting parameters. */ public static final String KN_DISCOUNT_PARAMS = "-kndiscount1 -kndiscount2 -kndiscount3 -kndiscount4 -kndiscount5 -kndiscount6"; /** String indicating the discounting option in filenames. */ public String discountOptionsStr = "n"; /** Debug level to use. */ public int debugLevel = 1; /** The context for this scorer maker. */ public CrossValidateRealizer cvr = null; /** Sets the context for this scorer maker. */ public void setCVR(CrossValidateRealizer cvr) { this.cvr = cvr; } /** Stores perplexities for each fold, after calls to prepScorer. */ protected List perplexities = new ArrayList(); /** Gets the n-gram order from the context, defaulting to 3. 
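* (That is, cvr.tester.ngramOrder when it is positive, otherwise 3.)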
*/ protected int getOrder() { int order = cvr.tester.ngramOrder; return (order > 0) ? order : 3; } /** Creates LM filenames from fold numbers. */ protected String filename(int foldNum) { String retval = "fold" + foldNum + "-" + discountOptionsStr; if (useSemClasses) retval += "-sc"; retval += "." + getOrder() + "bo"; return retval; } /** * Prepares a scoring model from the training data, * by exec-ing the SRILM ngram-count tool with the current options, * and computes perplexity on the test data. * The training/test data are written to foldN-train.txt and foldN-test.txt, * if not already present. * The LM file's name is determined by filename(N). */ public void prepScorer(File tmpDir, int foldNum, File trainFile, File testFile) throws IOException { // write training/test files, if not already present writeTrainingAndTestFiles(tmpDir, foldNum, trainFile, testFile); // make counting command String cmd = countNgrams(foldNum); // exec command System.out.print("Writing " + getOrder() + "-gram model: " + filename(foldNum) + "\n"); Process makeLM = Runtime.getRuntime().exec(cmd, null, tmpDir); try { InputStream istr = makeLM.getErrorStream(); //.getInputStream(); int b; while ((b = istr.read()) != -1) { System.out.print((char)b); } int exitval = makeLM.waitFor(); if (exitval != 0) { System.out.println("(f)ngram-count exitval: " + exitval); } } catch (InterruptedException exc) { throw (RuntimeException) new RuntimeException().initCause(exc); } System.out.println(); // make scoring command, for perplexity String cmd2 = scoreNgrams(foldNum); // exec command System.out.print("Measuring perplexity with: " + filename(foldNum) + "\n"); Process measurePPL = Runtime.getRuntime().exec(cmd2, null, tmpDir); try { InputStream istr = measurePPL.getInputStream(); int b; StringBuffer sb = new StringBuffer(); while ((b = istr.read()) != -1) { System.out.print((char)b); sb.append((char)b); } int exitval = measurePPL.waitFor(); // extract perplexity following "ppl= " String pplOut = sb.toString(); int pplStart = pplOut.indexOf("ppl= ") + "ppl= ".length(); int pplEnd = pplOut.indexOf(" ", pplStart); String pplStr = pplOut.substring(pplStart, pplEnd); try { perplexities.add(new Double(pplStr)); } catch (NumberFormatException exc) { System.out.println("Warning, unable to extract perplexity from: " + pplStr); System.out.println(exc.toString()); } if (exitval != 0) { System.out.println("(f)ngram exitval: " + exitval); } } catch (InterruptedException exc) { throw (RuntimeException) new RuntimeException().initCause(exc); } System.out.println(); } /** Writes the training and test files, if not already present. */ protected void writeTrainingAndTestFiles(File tmpDir, int foldNum, File trainFile, File testFile) throws IOException { File trainingFoldFile = new File(tmpDir, trainingfile(foldNum)); if (!trainingFoldFile.exists()) { String trainingFoldPath = trainingFoldFile.getCanonicalPath(); writeTargets(trainFile, trainingFoldPath); } File testFoldFile = new File(tmpDir, testfile(foldNum)); if (!testFoldFile.exists()) { String testFoldPath = testFoldFile.getCanonicalPath(); writeTargets(testFile, testFoldPath); } } /** Returns the name of the training file. */ protected String trainingfile(int foldNum) { return "fold" + foldNum + "-train.txt"; } /** Returns the name of the test file. */ protected String testfile(int foldNum) { return "fold" + foldNum + "-test.txt"; } /** Writes training/test targets. 
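* Delegates to the tester's writeTargets or writeTargetsSC method, depending
* on whether semantic class replacement is enabled.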
*/ protected void writeTargets(File tbFile, String textfile) throws IOException { if (!useSemClasses) cvr.tester.writeTargets(tbFile, textfile); else cvr.tester.writeTargetsSC(tbFile, textfile); } /** Returns the command for making an ngram model. */ protected String countNgrams(int foldNum) { String lmfile = filename(foldNum); String cmd = "ngram-count -order " + getOrder() + " " + ((unk) ? "-unk " : "") + minCountOptions + " " + discountOptions + " " + "-text " + trainingfile(foldNum) + " " + "-lm " + lmfile + " " + "-debug " + debugLevel; return cmd; } /** Returns the command for calculating perplexity. */ protected String scoreNgrams(int foldNum) { String lmfile = filename(foldNum); String cmd2 = "ngram -order " + getOrder() + " " + ((unk) ? "-unk " : "") + "-ppl " + testfile(foldNum) + " " + "-lm " + lmfile; return cmd2; } /** Returns the root of the perplexities filename. */ protected String pplFileRoot() { return discountOptionsStr + getOrder(); } /** * Summarizes perplexities after all calls to prepScorer. */ public void prepScorersSummary(File tmpDir) throws IOException { // summarize to sysout double sum = 0; System.out.print("Perplexities: "); for (int i = 0; i < perplexities.size(); i++) { double ppl = perplexities.get(i).doubleValue(); System.out.print(ppl + " "); sum += ppl; } System.out.println(); double avg = sum / perplexities.size(); System.out.println("Avg: " + avg); // then to xml String filename = "ppl"; if (useSemClasses) filename += "-sc"; filename += "." + pplFileRoot() + ".xml"; System.out.println("Writing perplexities: " + filename); PrintWriter pw = new PrintWriter(new FileWriter(new File(tmpDir, filename))); pw.println(""); for (int i = 0; i < perplexities.size(); i++) { pw.println(" "); } pw.println(""); pw.close(); } /** * Loads a scoring model created from the training data. */ public SignScorer loadScorer(File tmpDir, int foldNum, File trainFile) throws IOException { String lmfile = filename(foldNum); String lmPath = new File(tmpDir, lmfile).getCanonicalPath(); return new StandardNgramModel(getOrder(), lmPath, useSemClasses); } } ================================================ FILE: src/opennlp/ccg/ngrams/SelfParaphraseBiaser.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2011 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.ngrams; /** * Interface for scoring models that implement a self-paraphrase bias. * * @author Michael White * @version $Revision: 1.1 $, $Date: 2011/05/15 20:35:06 $ */ public interface SelfParaphraseBiaser { /** Sets the target strings for implementing the self-paraphrase bias. 
*/ public void setTargets(String[] targets); } ================================================ FILE: src/opennlp/ccg/ngrams/SignScorerInterpolation.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.ngrams; import opennlp.ccg.perceptron.*; import opennlp.ccg.synsem.Sign; import opennlp.ccg.synsem.SignScorer; /** * Linear interpolation of sign scorers, some of which may be feature extractors. * * @author Michael White * @version $Revision: 1.3 $, $Date: 2011/01/15 17:52:59 $ */ public class SignScorerInterpolation implements SignScorer, FeatureExtractor { /** The component models. */ protected SignScorer[] models; /** The weights. */ protected double weights[]; /** The composed feature extractor. */ protected ComposedFeatureExtractor composedFeatureExtractor; /** * Constructor with component models, which are given uniform weights. */ public SignScorerInterpolation(SignScorer[] models) { this.models = models; this.weights = new double[models.length]; for (int i = 0; i < models.length; i++) { weights[i] = 1.0 / models.length; } } /** * Constructor with component models and weights. * The weights are assumed to sum to 1, * and the number of weights is assumed to match the number of models. */ public SignScorerInterpolation(SignScorer[] models, double[] weights) { this.models = models; this.weights = weights; this.composedFeatureExtractor = new ComposedFeatureExtractor(models); } /** * Returns a score between 0 (worst) and 1 (best) for the given sign * and completeness flag, as the interpolation of the scores assigned * by the component models. * In particular, returns the linear combination using the established weights * of the scores given by the component models. */ public double score(Sign sign, boolean complete) { double retval = 0; for (int i = 0; i < models.length; i++) { retval += models[i].score(sign, complete) * weights[i]; } return retval; } /** Sets the alphabet for the component feature extractors. */ public void setAlphabet(Alphabet alphabet) { composedFeatureExtractor.setAlphabet(alphabet); } /** Returns the features for the given sign and completeness flag from the component feature extractors. 
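* <p>
* A hedged construction sketch (the model file name is hypothetical and
* exception handling is omitted): a trigram model interpolated with a
* repetition scorer, weighted 0.8 and 0.2, could be set up as
* <pre>
*   SignScorer[] models = { new StandardNgramModel(3, "lm.3bo"), new RepetitionScorer() };
*   SignScorer scorer = new SignScorerInterpolation(models, new double[] { 0.8, 0.2 });
* </pre>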
*/ public FeatureVector extractFeatures(Sign sign, boolean complete) { return composedFeatureExtractor.extractFeatures(sign, complete); } } ================================================ FILE: src/opennlp/ccg/ngrams/SignScorerProduct.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.ngrams; import opennlp.ccg.perceptron.*; import opennlp.ccg.synsem.Sign; import opennlp.ccg.synsem.SignScorer; // import java.util.*; /** * Product of sign scorers, some of which may be feature extractors.. * * @author Michael White * @version $Revision: 1.4 $, $Date: 2011/01/15 17:52:59 $ */ public class SignScorerProduct implements SignScorer, FeatureExtractor { /** The component models. */ protected SignScorer[] models; /** The composed feature extractor. */ protected ComposedFeatureExtractor composedFeatureExtractor; /** * Constructor with component models. */ public SignScorerProduct(SignScorer[] models) { this.models = models; this.composedFeatureExtractor = new ComposedFeatureExtractor(models); } /** * Returns a score between 0 (worst) and 1 (best) for the given sign * and completeness flag, as the product of the scores assigned * by the component models. */ public double score(Sign sign, boolean complete) { double retval = 1.0; for (int i = 0; i < models.length; i++) { retval *= models[i].score(sign, complete); } return retval; } /** Sets the alphabet for the component feature extractors. */ public void setAlphabet(Alphabet alphabet) { composedFeatureExtractor.setAlphabet(alphabet); } /** Returns the features for the given sign and completeness flag from the component feature extractors. */ public FeatureVector extractFeatures(Sign sign, boolean complete) { return composedFeatureExtractor.extractFeatures(sign, complete); } } ================================================ FILE: src/opennlp/ccg/ngrams/StandardNgramModel.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004-5 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. 
// // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.ngrams; import java.io.BufferedReader; import java.io.FileReader; import java.io.IOException; import java.io.Reader; import java.io.StreamTokenizer; import java.util.ArrayList; import java.util.List; import opennlp.ccg.lexicon.DefaultTokenizer; import opennlp.ccg.lexicon.Tokenizer; import opennlp.ccg.lexicon.Word; import opennlp.ccg.util.TrieMap; /** * A scorer for a standard n-gram backoff model. * Unknown words are mapped to <unk> if the latter is present in * the model. * * @author Michael White * @version $Revision: 1.19 $, $Date: 2011/10/11 03:29:42 $ */ public class StandardNgramModel extends AbstractStandardNgramModel { /** * Loads an n-gram model of the given order in ARPA (Doug Paul) format from * the given reader, with the given flag controlling whether words are * replaced by their semantic classes. */ public StandardNgramModel(int order, Reader in, boolean useSemClasses) throws IOException { super(order, useSemClasses); this.numNgrams = new int[order]; readModel(in); } /** * Loads an n-gram model of the given order in ARPA (Doug Paul) format from * the given reader. Words are not replaced by their semantic classes. */ public StandardNgramModel(int order, Reader in) throws IOException { this(order, in, false); } /** * Loads an n-gram model of the given order in ARPA (Doug Paul) format from * the given file, with the given flag controlling whether words are * replaced by their semantic classes. */ public StandardNgramModel(int order, String filename, boolean useSemClasses) throws IOException { this(order, new BufferedReader(new FileReader(filename)), useSemClasses); } /** * Loads an n-gram model of the given order in ARPA (Doug Paul) format from * the given file. Words are not replaced by their semantic classes. */ public StandardNgramModel(int order, String filename) throws IOException { this(order, filename, false); } // reads in model private void readModel(Reader in) throws IOException { // setup //Tokenizer wordTokenizer = (Grammar.theGrammar != null) // ? 
Grammar.theGrammar.lexicon.tokenizer // : new DefaultTokenizer(); StreamTokenizer tokenizer = initTokenizer(in); String[] tokens = new String[order+2]; boolean foundData = false; int currentOrder = 0; List currentPrefix = new ArrayList(); List currentKeys = null; List> currentChildren = null; // loop through lines while (tokenizer.ttype != StreamTokenizer.TT_EOF) { // read line into tokens readLine(tokenizer, tokens); // check for blank line if (tokens[0] == null) continue; // check for initial delimiter if (tokens[0].equals("\\data\\")) { foundData = true; continue; } if (!foundData) continue; // read header line if (tokens[0].equals("ngram")) { int n = Integer.parseInt(tokens[1].substring(0,1)); int total = Integer.parseInt(tokens[1].substring(2)); if (n > order) continue; numNgrams[n-1] = total; // init children, keys lists if (currentChildren == null) { currentChildren = new ArrayList>(total); currentKeys = new ArrayList(total); } // calc totals (not actually used anymore) if (n == order) { @SuppressWarnings("unused") int totalNgrams = 0; for (int i = 0; i < order; i++) { totalNgrams += numNgrams[i]; } // System.out.println("totalNgrams: " + totalNgrams); } continue; } // check for final delimiter if (tokens[0].equals("\\end\\")) { // add current children addTrieMapChildren(currentPrefix, currentKeys, currentChildren); break; } // read line starting new order if (tokens[0].equals("\\" + (currentOrder+1) + "-grams:")) { // add current children addTrieMapChildren(currentPrefix, currentKeys, currentChildren); // System.out.println(tokens[0]); currentOrder++; continue; } if (currentOrder == 0) continue; if (currentOrder > order) break; // read logprob float logprob = Float.parseFloat(tokens[0]); // read back-off weight (except with last order) float bow = 0; if (currentOrder < order && tokens[currentOrder+1] != null) { bow = Float.parseFloat(tokens[currentOrder+1]); } // intern string tokens for (int i = 1; i < currentOrder+1; i++) { tokens[i] = tokens[i].intern(); } // check prefix boolean samePrefix = (currentPrefix.size() == currentOrder-1); for (int i = 1; samePrefix && i < currentOrder; i++) { if (tokens[i] != currentPrefix.get(i-1)) samePrefix = false; } // if changed, add current children, reset prefix if (!samePrefix) { addTrieMapChildren(currentPrefix, currentKeys, currentChildren); for (int i = 1; i < currentOrder; i++) { currentPrefix.add(tokens[i]); } } String key = tokens[currentOrder]; currentKeys.add(key); currentChildren.add(new TrieMap(new NgramFloats(logprob, bow))); } // set openVocab according to presence of openVocab = (trieMapRoot.getChild("") != null); } /** Test loading and scoring. */ // NB: This produces the same scores as the SRILM ngram tool when both // and tags are used. public static void main(String[] args) throws IOException { String usage = "Usage: java opennlp.ccg.ngrams.StandardNgramModel (-reverse)"; if (args.length > 0 && args[0].equals("-h")) { System.out.println(usage); System.exit(0); } long start = System.currentTimeMillis(); String order = args[0]; String lmfile = args[1]; String tokens = args[2]; String reversed = (args.length >= 4 && args[3].equals("-reverse")) ? 
"reversed " : ""; System.out.println("Loading " + reversed + "n-gram model with order " + order + " from: " + lmfile); StandardNgramModel lm = new StandardNgramModel(Integer.parseInt(order), lmfile); if (reversed.length() > 0) lm.setReverse(true); System.out.println("openVocab: " + lm.openVocab); int secs = (int) (System.currentTimeMillis() - start) / 1000; System.out.println("secs: " + secs); System.out.println(); // System.out.println("trie map: "); // System.out.println(lm.trieMapRoot.toString()); // System.out.println(); Tokenizer tokenizer = new DefaultTokenizer(); List words = tokenizer.tokenize(tokens); System.out.println("scoring: " + tokens); System.out.println(); lm.debugScore = true; lm.setWordsToScore(words, true); lm.prepareToScoreWords(); double logprob = lm.logprob(); double score = convertToProb(logprob); System.out.println(); System.out.println("score: " + score); System.out.println("logprob: " + logprob); System.out.println("ppl: " + NgramScorer.convertToPPL(logprob / (words.size()-1))); } } ================================================ FILE: src/opennlp/ccg/ngrams/kenlm/MurmurHash.java ================================================ package opennlp.ccg.ngrams.kenlm; import java.io.UnsupportedEncodingException; /** * MurmurHash 2.0. * * The murmur hash is a relative fast hash function from http://murmurhash.googlepages.com/ for * platforms with efficient multiplication. * * This is a re-implementation of the original C code plus some additional features. * * Public domain. * * @author Viliam Holub * @version 1.0.2 * */ public final class MurmurHash { private final static String ENCODING = "UTF-16"; /** * Generates 32 bit hash from byte array of the given length and seed. * * @param data byte array to hash * @param length length of the array to hash * @param seed initial seed value * @return 32 bit hash of the given array */ public static int hash32(final byte[] data, int length, int seed) { // 'm' and 'r' are mixing constants generated offline. // They're not really 'magic', they just happen to work well. final int m = 0x5bd1e995; final int r = 24; // Initialize the hash to a random value int h = seed ^ length; int length4 = length / 4; for (int i = 0; i < length4; i++) { final int i4 = i * 4; int k = (data[i4 + 0] & 0xff) + ((data[i4 + 1] & 0xff) << 8) + ((data[i4 + 2] & 0xff) << 16) + ((data[i4 + 3] & 0xff) << 24); k *= m; k ^= k >>> r; k *= m; h *= m; h ^= k; } // Handle the last few bytes of the input array switch (length % 4) { case 3: h ^= (data[(length & ~3) + 2] & 0xff) << 16; case 2: h ^= (data[(length & ~3) + 1] & 0xff) << 8; case 1: h ^= (data[length & ~3] & 0xff); h *= m; } h ^= h >>> 13; h *= m; h ^= h >>> 15; return h; } /** * Generates 32 bit hash from byte array with default seed value. * * @param data byte array to hash * @param length length of the array to hash * @return 32 bit hash of the given array */ public static int hash32(final byte[] data, int length) { return hash32(data, length, 0x9747b28c); } /** * Generates 32 bit hash from a string. * * @param text string to hash * @return 32 bit hash of the given string * @throws UnsupportedEncodingException */ public static int hash32(final String text) throws UnsupportedEncodingException { final byte[] bytes = text.getBytes(ENCODING); return hash32(bytes, bytes.length); } /** * Generates 32 bit hash from a substring. 
* * @param text string to hash * @param from starting index * @param length length of the substring to hash * @return 32 bit hash of the given string * @throws UnsupportedEncodingException */ public static int hash32(final String text, int from, int length) throws UnsupportedEncodingException { return hash32(text.substring(from, from + length)); } /** * Generates 64 bit hash from byte array of the given length and seed. * * @param data byte array to hash * @param length length of the array to hash * @param seed initial seed value * @return 64 bit hash of the given array */ public static long hash64(final byte[] data, int length, int seed) { final long m = 0xc6a4a7935bd1e995L; final int r = 47; long h = (seed & 0xffffffffl) ^ (length * m); int length8 = length / 8; for (int i = 0; i < length8; i++) { final int i8 = i * 8; long k = ((long) data[i8 + 0] & 0xff) + (((long) data[i8 + 1] & 0xff) << 8) + (((long) data[i8 + 2] & 0xff) << 16) + (((long) data[i8 + 3] & 0xff) << 24) + (((long) data[i8 + 4] & 0xff) << 32) + (((long) data[i8 + 5] & 0xff) << 40) + (((long) data[i8 + 6] & 0xff) << 48) + (((long) data[i8 + 7] & 0xff) << 56); k *= m; k ^= k >>> r; k *= m; h ^= k; h *= m; } switch (length % 8) { case 7: h ^= (long) (data[(length & ~7) + 6] & 0xff) << 48; case 6: h ^= (long) (data[(length & ~7) + 5] & 0xff) << 40; case 5: h ^= (long) (data[(length & ~7) + 4] & 0xff) << 32; case 4: h ^= (long) (data[(length & ~7) + 3] & 0xff) << 24; case 3: h ^= (long) (data[(length & ~7) + 2] & 0xff) << 16; case 2: h ^= (long) (data[(length & ~7) + 1] & 0xff) << 8; case 1: h ^= (long) (data[length & ~7] & 0xff); h *= m; }; h ^= h >>> r; h *= m; h ^= h >>> r; return h; } /** * Generates 64 bit hash from byte array with default seed value. * * @param data byte array to hash * @param length length of the array to hash * @return 64 bit hash of the given string */ public static long hash64(final byte[] data, int length) { return hash64(data, length, 0xe17a1465); } /** * Generates 64 bit hash from a string. * * @param text string to hash * @return 64 bit hash of the given string * @throws UnsupportedEncodingException */ public static long hash64(final String text) throws UnsupportedEncodingException { byte[] bytes; bytes = text.getBytes(ENCODING); return hash64(bytes, bytes.length); } /** * Generates 64 bit hash from a substring. * * @param text string to hash * @param from starting index * @param length length of the substring to hash * @return 64 bit hash of the given array * @throws UnsupportedEncodingException */ public static long hash64(final String text, int from, int length) throws UnsupportedEncodingException { return hash64(text.substring(from, from + length)); } } ================================================ FILE: src/opennlp/ccg/ngrams/kenlm/jni/KenLM.java ================================================ package opennlp.ccg.ngrams.kenlm.jni; // TODO(Joshua devs): include my state object with your LM state then // update this API to pass state instead of int[]. public class KenLM { /** * Load the binary, platform-dependent library containing the KenLM JNI * bridge code. * @throws UnsatisfiedLinkError If Java can't find the 'ken' library. 
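* The library is resolved via java.library.path, so the JVM typically needs
* to be started with an option along the lines of -Djava.library.path=DIR,
* where DIR is the (installation-dependent) directory holding the built
* 'ken' JNI bridge.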
*/ static { System.loadLibrary("ken"); } private final long pointer; // this is read from the config file, used to set maximum order private final int ngramOrder; // inferred from model file (may be larger than ngramOrder) private final int N; private final static native long construct(String file_name, float fake_oov); private final static native void destroy(long ptr); private final static native int order(long ptr); private final static native boolean registerWord(long ptr, String word, int id); private final static native float prob(long ptr, int words[]); private final static native float probString(long ptr, int words[], int start); public KenLM(int order, String file_name) { float lm_ceiling_cost = 99.0f; ngramOrder = order; pointer = construct(file_name, -lm_ceiling_cost); N = order(pointer); } public void destroy() { destroy(pointer); } public int getOrder() { return N; } public boolean registerWord(String word, int id) { return registerWord(pointer, word, id); } public float prob(int words[]) { return prob(pointer, words); } } ================================================ FILE: src/opennlp/ccg/parse/Chart.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-10 Jason Baldridge, Gann Bierner and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse; import opennlp.ccg.grammar.*; import opennlp.ccg.synsem.*; import gnu.trove.*; import java.io.*; import java.util.*; /** * An implementation of the table (or chart) used for chart parsers like CKY. * Special functions are provided for combining cells of the chart into another * cell. Time or edge or cell limits can be placed on initial chart construction. * A pruning value applies to unpacking, which also limits the number of equivalent * edges kept during chart construction. 
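* <p>
* A hedged sketch of the intended fill pattern (not the actual parser loop):
* lexical signs are added with insert(x, y, sign), unary rules are applied
* within a cell via insertCell(x, y), and two cells are combined into a third
* with insertCell(x1, y1, x2, y2, x3, y3); setPruneVal, setCellLimit,
* setEdgeLimit and setTimeLimit bound the work done during construction and
* unpacking.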
* * @author Jason Baldridge * @author Gann Bierner * @author Michael White * @version $Revision: 1.41 $, $Date: 2011/11/16 03:25:27 $ */ public class Chart { // maps edges to representative edges, according to their headwords and cats, sans LFs // NB: using unfilled dependencies in equiv relation appears to unacceptably slow down parsing, // with a significant drop in complete parses @SuppressWarnings("unchecked") private static Map createEdgeMap() { return new THashMap(11, representativeEdgeStrategy); } private static TObjectHashingStrategy representativeEdgeStrategy = new TObjectHashingStrategy() { private static final long serialVersionUID = 1L; public int computeHashCode(Object o) { Sign sign = ((Edge)o).sign; int headpos = Edge.getEdge(sign.getLexHead()).wordPos; return 31*headpos + sign.getCategory().hashCodeNoLF(); //return 31*headpos + sign.getCategory().hashCodeNoLF() + 17*sign.getUnfilledDeps().hashCode(); } public boolean equals(Object o1, Object o2) { if (!(o1 instanceof Edge) || !(o2 instanceof Edge)) return false; Sign sign1 = ((Edge)o1).sign; Sign sign2 = ((Edge)o2).sign; return Edge.getEdge(sign1.getLexHead()).wordPos == Edge.getEdge(sign2.getLexHead()).wordPos && sign1.getCategory().equalsNoLF(sign2.getCategory()); //&& sign1.getUnfilledDeps().equals(sign2.getUnfilledDeps()); } }; // a cell pairs a sorted list with an edge map private class Cell implements Serializable { private static final long serialVersionUID = 1L; final List list = new ArrayList(); final Map map = createEdgeMap(); int size() { return list.size(); } Edge get(Edge edge) { return map.get(edge); } // add edge, preserving cell limit; return true iff given edge added boolean add(Edge edge) { if (map.containsKey(edge)) return false; return addEdgeSorted(edge, list, map, _cellLimit); } List getSignsSorted() { List retval = new ArrayList(list.size()); for (Edge e : list) retval.add(e.sign); return retval; } SignHash getSigns() { SignHash retval = new SignHash(); for (Edge e : list) retval.insert(e.sign); return retval; } }; // adds edge to sorted list and optional map, preserving limit; returns true iff edge added // nb: all lexical edges kept private boolean addEdgeSorted(Edge edge, List list, Map map, int limit) { int index = Collections.binarySearch(list, edge, edgeComparator); // convert index to insertion point index = Math.abs(index) - 1; // if somehow negative, use last position if (index < 0) index = list.size(); // check if last and at limit boolean limitActive = limit > 0 && !edge.sign.isLexical(); if (limitActive && index >= limit) return false; // otherwise add edge list.add(index, edge); if (map != null) map.put(edge, edge); // remove last if over limit if (limitActive && list.size() > limit) { Edge last = list.remove(list.size()-1); if (map != null) map.remove(last); } return true; } /** Compares edges based on their relative score, in descending order, then their signs. */ public static final Comparator edgeComparator = new Comparator() { public int compare(Edge edge1, Edge edge2) { if (edge1.score != edge2.score) return -1 * Double.compare(edge1.score, edge2.score); else return SignHash.compareTo(edge1.sign, edge2.sign); } }; /** The chart. */ protected Cell[][] _table; /** Its size. */ protected int _size; /** The count of edges created before unpacking. */ protected int _numEdges = 0; /** The count of edges created while unpacking. */ protected int _numUnpackingEdges = 0; /** The max cell size before unpacking. */ protected int _maxCellSize = 0; /** The rules. 
*/ protected RuleGroup _rules; /** The sign scorer (defaults to the null scorer). */ protected SignScorer _signScorer = SignScorer.nullScorer; /** The "n" for n-best pruning (or 0 if none). */ protected int _pruneVal = 0; /** The time limit (0 if none). */ protected int _timeLimit = 0; /** The start time. */ protected long _startTime = 0; /** The edge limit (0 if none). */ protected int _edgeLimit = 0; /** The cell limit on non-lexical edges (0 if none). */ protected int _cellLimit = 0; /** Constructor. */ public Chart(int s, RuleGroup _R) { _rules = _R; _size = s; _table = new Cell[_size][_size]; } /** Sets the sign scorer. */ public void setSignScorer(SignScorer signScorer) { _signScorer = signScorer; } /** Sets the n-best pruning val. */ public void setPruneVal(int n) { _pruneVal = n; } /** Sets the time limit. */ public void setTimeLimit(int timeLimit) { _timeLimit = timeLimit; } /** Sets the start time. */ public void setStartTime(long startTime) { _startTime = startTime; } /** Sets the edge limit. */ public void setEdgeLimit(int edgeLimit) { _edgeLimit = edgeLimit; } /** Sets the cell limit on non-lexical edges. */ public void setCellLimit(int cellLimit) { _cellLimit = cellLimit; } /** Returns the edge count prior to unpacking. */ public int edgeCount() { return _numEdges; } /** Returns the edge count while unpacking. */ public int unpackingEdgeCount() { return _numUnpackingEdges; } /** Returns the max cell size prior to unpacking. */ public int maxCellSize() { return _maxCellSize; } //----------------------------------------------------------- // Chart construction /** * Inserts a sign at the given cell (modulo pruning). * Returns true if an edge for the sign is added as a new equiv class. */ public boolean insert(int x, int y, Sign w) { Cell cell = get(x, y); boolean retval = false; // make edge Edge edge = new Edge(w); if (w.isLexical()) edge.setWordPos(x); // get representative edge Edge rep = cell.get(edge); // if none, add as representative if (rep == null) { edge.initAltEdges(); retval = cell.add(edge); } // otherwise add as an alternative else { addEdgeSorted(edge, rep.altEdges, null, _pruneVal); } // update edge count, max cell size _numEdges++; if (cell.size() > _maxCellSize) _maxCellSize = cell.size(); // done return retval; } /** Returns the given cell (ensuring non-null). */ protected Cell get(int x, int y) { if (_table[x][y] == null) _table[x][y] = new Cell(); return _table[x][y]; } /** Returns the signs for a given cell (ensuring non-null). */ protected SignHash getSigns(int x, int y) { Cell cell = get(x, y); return cell.getSigns(); } /** Inserts edges into (x,y) that result from applying unary rules to those already in (x,y). 
* @throws ParseException */ protected void insertCell(int x, int y) throws ParseException { if (_table[x][y] == null) return; List inputs = _table[x][y].getSignsSorted(); List nextInputs = new ArrayList(inputs.size()); // repeat until no more inputs while (inputs.size() > 0) { // apply rules for (Sign sign : inputs) { checkLimits(); List results = _rules.applyUnaryRules(sign); for (Sign result : results) { // check for unary rule cycle; skip result if found if (!result.getDerivationHistory().containsCycle()) { // insert result boolean newEdgeClass = insert(x, y, result); // add to next inputs if it yielded a new equiv class if (newEdgeClass) nextInputs.add(result); } } } // move all results to inputs inputs.clear(); inputs.addAll(nextInputs); nextInputs.clear(); } } /** Inserts edges into (x3,y3) resulting from combining those in (x1,y1) and (x2,y2). * @throws ParseException */ protected void insertCell(int x1, int y1, int x2, int y2, int x3, int y3) throws ParseException { if (_table[x1][y1] == null) return; if (_table[x2][y2] == null) return; List inputs1 = _table[x1][y1].getSignsSorted(); List inputs2 = _table[x2][y2].getSignsSorted(); for (Sign sign1 : inputs1) { for (Sign sign2 : inputs2) { checkLimits(); List results = _rules.applyBinaryRules(sign1, sign2); for (Sign result : results) insert(x3, y3, result); } } } /** * Inserts fragmentary edges into (x3,y3), if non-empty, resulting from combining * those in (x1,y1) and (x2,y2) using the glue rule. * @throws ParseException */ protected void insertCellFrag(int x1, int y1, int x2, int y2, int x3, int y3) throws ParseException { if (_table[x1][y1] == null) return; if (_table[x2][y2] == null) return; if (!cellIsEmpty(x3, y3)) return; List inputs1 = _table[x1][y1].getSignsSorted(); List inputs2 = _table[x2][y2].getSignsSorted(); for (Sign sign1 : inputs1) { for (Sign sign2 : inputs2) { checkLimits(); List results = _rules.applyGlueRule(sign1, sign2); for (Sign result : results) insert(x3, y3, result); } } } // check edge and time limit private void checkLimits() throws ParseException { if (_edgeLimit > 0 && _numEdges > _edgeLimit) { throw new ParseException(ParseException.EDGE_LIMIT_EXCEEDED); } if (_timeLimit > 0) { int timeSoFar = (int) (System.currentTimeMillis() - _startTime); if (timeSoFar > _timeLimit) { throw new ParseException(ParseException.TIME_LIMIT_EXCEEDED); } } } /** Returns whether the given cell is empty. */ public boolean cellIsEmpty(int x, int y) { Cell cell = get(x, y); return cell.list.isEmpty(); } //----------------------------------------------------------- // Unpacking /** Unpacks the edges in the given cell as an n-best list. 
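 * The returned list is sorted by score and, when a pruning value is set,
 * limited to the n best edges. For instance (a schematic fragment only,
 * assuming a filled chart):
 * <pre>{@code
 * List<Edge> nbest = chart.unpack(0, size - 1);   // unpack the top cell
 * for (Edge e : nbest)
 *     System.out.println(e.getScore() + "\t" + e.getSign());
 * }</pre>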
*/ public List unpack(int x, int y) { Cell cell = get(x, y); // recursively unpack each edge @SuppressWarnings("unchecked") Set unpacked = new THashSet(new TObjectIdentityHashingStrategy()); @SuppressWarnings("unchecked") Set startedUnpacking = new THashSet(new TObjectIdentityHashingStrategy()); for (Edge edge : cell.list) unpack(edge, unpacked, startedUnpacking); // collect and sort results EdgeHash merged = new EdgeHash(); for (Edge edge : cell.list) { merged.addAll(edge.altEdges); } List retval = new ArrayList(merged.asEdgeSet()); Collections.sort(retval, edgeComparator); // prune if (_pruneVal > 0) { while (retval.size() > _pruneVal) retval.remove(retval.size()-1); } // restore alts for (Edge edge : cell.list) edge.restoreAltEdges(); // return return retval; } // recursively unpack edge, unless already visited private void unpack(Edge edge, Set unpacked, Set startedUnpacking) { // check visited if (unpacked.contains(edge)) return; if (startedUnpacking.contains(edge)) { System.err.println("Warning, revisiting edge before unpacking complete: " + edge); System.err.println(edge.sign.getDerivationHistory().toString()); return; } startedUnpacking.add(edge); // OR: recursively unpack alts, merging resulting alts EdgeHash merged = new EdgeHash(); for (Edge alt : edge.altEdges) { // AND: unpack inputs, make alts, add to merged unpackAlt(alt, unpacked, startedUnpacking, merged); } // score boolean complete = (edge.sign.getWords().size() == _size); for (Edge m : merged.asEdgeSet()) { m.setScore(_signScorer.score(m.sign, complete)); } // sort List mergedList = new ArrayList(merged.asEdgeSet()); Collections.sort(mergedList, edgeComparator); // prune if (_pruneVal > 0) { while (mergedList.size() > _pruneVal) mergedList.remove(mergedList.size()-1); } // replace edge's alts edge.replaceAltEdges(mergedList); // add to unpacked set unpacked.add(edge); } // recursively unpack inputs, make alt combos and add to merged private void unpackAlt(Edge alt, Set unpacked, Set startedUnpacking, EdgeHash merged) { // unpack via input signs DerivationHistory history = alt.sign.getDerivationHistory(); Sign[] inputSigns = history.getInputs(); // base case: no inputs if (inputSigns == null) { merged.insert(alt); return; } // otherwise recursively unpack Edge[] inputEdges = new Edge[inputSigns.length]; for (int i = 0; i < inputSigns.length; i++) { inputEdges[i] = Edge.getEdge(inputSigns[i]); unpack(inputEdges[i], unpacked, startedUnpacking); } // then make edges for new combos, using same rule, and add to merged (if unseen) Rule rule = history.getRule(); List altCombos = inputCombos(inputEdges, 0); List results = new ArrayList(1); for (Sign[] combo : altCombos) { // use this alt for same combo if (sameSigns(inputSigns, combo)) { merged.insert(alt); continue; } results.clear(); ((AbstractRule)rule).applyRule(combo, results); // TODO: bypass rule app for efficiency? (requires doing something about var subst) if (results.isEmpty()) continue; // (rare?) 
Sign sign = results.get(0); // assuming single result merged.insert(new Edge(sign)); // make edge for new alt _numUnpackingEdges++; } } // returns a list of sign arrays, with each array of length inputEdges.length - i, // representing all combinations of alt signs from i onwards private List inputCombos(Edge[] inputEdges, int index) { Edge edge = inputEdges[index]; // base case, inputEdges[last] if (index == inputEdges.length-1) { List altEdges = edge.altEdges; List retval = new ArrayList(altEdges.size()); for (Edge alt : altEdges) { retval.add(new Sign[] { alt.sign }); } return retval; } // otherwise recurse on index+1 List nextCombos = inputCombos(inputEdges, index+1); // and make new combos List altEdges = edge.altEdges; List retval = new ArrayList(altEdges.size() * nextCombos.size()); for (Edge alt : altEdges) { for (int i = 0; i < nextCombos.size(); i++) { Sign[] nextSigns = nextCombos.get(i); Sign[] newCombo = new Sign[nextSigns.length+1]; newCombo[0] = alt.sign; System.arraycopy(nextSigns, 0, newCombo, 1, nextSigns.length); retval.add(newCombo); } } return retval; } // checks for same signs private boolean sameSigns(Sign[] a, Sign[] b) { if (a.length != b.length) return false; for (int i=0; i < a.length; i++) if (a[i] != b[i]) return false; return true; } //----------------------------------------------------------- // Lazy Unpacking /** * Lazily unpacks the edges in the given cell as an n-best list * using a variant of "cube pruning". The algorithm essentially * follows Algorithm 2 of Huang and Chiang (2005), with checking * for spurious ambiguity. */ @SuppressWarnings("unchecked") public List lazyUnpack(int x, int y) { // if no pruning value set, use basic unpacking algorithm if (_pruneVal <= 0) return unpack(x, y); // recursively sort edge alts Cell cell = get(x, y); // make top-level candidate list and derivs map List topcands = new ArrayList(_pruneVal); Map> derivsmap = new THashMap(new TObjectIdentityHashingStrategy()); for (Edge edge : cell.list) { List cands = getCandidates(edge, derivsmap); topcands.addAll(cands); } sortAndPrune(topcands); // NB: no single edge for top cell, so must treat it as a special case of findKBest List retval = new ArrayList(_pruneVal); EdgeHash merged = new EdgeHash(); while (merged.size() < _pruneVal && !topcands.isEmpty()) { appendNext(topcands, merged, derivsmap); } retval.addAll(merged.asEdgeSet()); // rescore edges if apropos if (_signScorer instanceof ReRankingScorer) { ReRankingScorer rescorer = (ReRankingScorer) _signScorer; rescorer.setFullModel(true); for (Edge e : retval) { e.score = rescorer.score(e.sign, true); } rescorer.setFullModel(false); } Collections.sort(retval, edgeComparator); // done return retval; } // lazily find k-best derivations, if edge not already visited private void findKBest(Edge edge, Map> derivsmap) { if (derivsmap.containsKey(edge)) return; List cands = getCandidates(edge, derivsmap); EdgeHash merged = new EdgeHash(); while (merged.size() < _pruneVal && !cands.isEmpty()) { appendNext(cands, merged, derivsmap); } List derivs = new ArrayList(_pruneVal); derivs.addAll(merged.asEdgeSet()); Collections.sort(derivs, edgeComparator); derivsmap.put(edge, derivs); } // appends next candidate, expands frontier private void appendNext(List cands, EdgeHash merged, Map> derivsmap) { // append next Candidate cand = cands.remove(0); merged.add(cand.edge); // check for lex cand if (cand.indices == null) return; // enumerate frontier for (int i=0; i < cand.indices.length; i++) { // inc nextIndices at i int[] nextIndices = new 
int[cand.indices.length]; for (int m=0; m < nextIndices.length; m++) nextIndices[m] = cand.indices[m]; nextIndices[i]++; Edge next = getEdgeForIndices(cand.edge, cand.inputReps, nextIndices, derivsmap); // add next candidate, if any, if not already there if (next != null) { Candidate nextCand = new Candidate(next, cand.inputReps, nextIndices); if (!cands.contains(nextCand)) { int index = Collections.binarySearch(cands, nextCand); index = Math.abs(index) - 1; // convert index to insertion point if (index >= 0) cands.add(index, nextCand); else cands.add(nextCand); } } } } // candidate is an edge plus an array of indices for keeping track of // where to pull candidates from next (or null if lexical), // using the input representatives private static class Candidate implements Comparable { Edge edge; Edge[] inputReps; int[] indices; Candidate(Edge edge, Edge[] inputReps, int[] indices) { this.edge = edge; this.inputReps = inputReps; this.indices = indices; } public int compareTo(Candidate c) { int retval = edgeComparator.compare(edge, c.edge); if (retval != 0) return retval; if (indices == null && c.indices == null) return 0; if (indices == null && c.indices != null) return -1; if (indices != null && c.indices == null) return 1; if (indices.length < c.indices.length) return -1; if (indices.length > c.indices.length) return 1; for (int i=0; i < indices.length; i++) { if (indices[i] < c.indices[i]) return -1; if (indices[i] > c.indices[i]) return 1; } return 0; } public boolean equals(Object o) { if (!(o instanceof Candidate)) return false; Candidate c = (Candidate)o; if (indices != null && c.indices == null) return false; if (indices == null && c.indices != null) return false; if (indices != null && c.indices != null) { if (indices.length != c.indices.length) return false; for (int i=0; i < indices.length; i++) { if (indices[i] != c.indices[i]) return false; } } return edge.equals(c.edge); } } // get candidates for unpacking an edge private List getCandidates(Edge edge, Map> derivsmap) { List retval = new ArrayList(_pruneVal); // make initial candidate for each alt // nb: should only get initial candidates for representative edges, // but may as well ensure that at least this edge is included List alts = new ArrayList(edge.getAltEdges()); if (alts.isEmpty()) alts.add(edge); for (Edge alt : alts) { Sign[] inputs = alt.sign.getDerivationHistory().getInputs(); // lex case: no indices if (inputs == null) { retval.add(new Candidate(alt, null, null)); continue; } // otherwise get edge for best inputs Edge[] inputReps = new Edge[inputs.length]; int[] indices = new int[inputs.length]; for (int i=0; i < inputs.length; i++) { inputReps[i] = Edge.getEdge(inputs[i]); indices[i] = 0; } Edge e = getEdgeForIndices(alt, inputReps, indices, derivsmap); if (e != null) { retval.add(new Candidate(e, inputReps, indices)); } } // sort and prune sortAndPrune(retval); // done return retval; } // returns the edge for the given input indices, or null if none private Edge getEdgeForIndices(Edge edge, Edge[] inputReps, int[] indices, Map> derivsmap) { DerivationHistory history = edge.sign.getDerivationHistory(); Sign[] combo = new Sign[inputReps.length]; for (int i = 0; i < inputReps.length; i++) { Edge inputEdge = inputReps[i]; // recurse findKBest(inputEdge, derivsmap); // get derivs List inputDerivs = derivsmap.get(inputEdge); // check index, return null if out of bounds if (indices[i] < inputDerivs.size()) combo[i] = inputDerivs.get(indices[i]).sign; else return null; } // return edge if combo is same as input signs 
Sign[] inputSigns = history.getInputs(); if (sameSigns(inputSigns, combo)) return edge; // otherwise return new edge for combo Rule rule = history.getRule(); List results = new ArrayList(1); ((AbstractRule)rule).applyRule(combo, results); // TODO: bypass rule app for efficiency? (requires doing something about var subst) if (results.isEmpty()) return null; // (rare?) Sign sign = results.get(0); // assuming single result Edge retval = new Edge(sign); // make edge for new combo _numUnpackingEdges++; // score it boolean complete = (sign.getWords().size() == _size); retval.setScore(_signScorer.score(sign, complete)); // done return retval; } // sort and prune candidate list private void sortAndPrune(List cands) { Collections.sort(cands); while (cands.size() > _pruneVal) cands.remove(cands.size()-1); } //----------------------------------------------------------- /** Saves the chart entries to the given file. */ public void saveChartEntries(File file) throws IOException { ObjectOutputStream out = new ObjectOutputStream(new BufferedOutputStream(new FileOutputStream(file))); out.writeObject(_table); out.flush(); out.close(); } /** Loads the chart entries from the given file. */ public void loadChartEntries(File file) throws IOException { ObjectInputStream in = new ObjectInputStream(new BufferedInputStream(new FileInputStream(file))); try { // read entries _table = (Cell[][]) in.readObject(); // restore size, unpacking edge count _size = _table.length; _numUnpackingEdges = 0; } catch (ClassNotFoundException e) { in.close(); throw (RuntimeException) new RuntimeException().initCause(e); } in.close(); } //----------------------------------------------------------- /** Returns the number of entries in each cell in the chart. */ public String toString() { StringBuffer sb = new StringBuffer(); for (int i = 0; i < _size; i++) { for (int j = 0; j < _size; j++) { sb.append(get(i, j).size()).append('\t'); } sb.append('\n'); } return sb.toString(); } /** Prints the signs in the chart to System.out. 
*/ public void printChart() { int[] sizes = new int[_size]; int rows = 0; for (int i = 0; i < _size; i++) { for (int j = i; j < _size; j++) if (get(i, j).size() > sizes[i]) sizes[i] = get(i, j).size(); rows += sizes[i]; } String[][] toprint = new String[rows][_size]; String[] words = new String[_size]; int maxwidth = 0; for (int i = 0, row = 0; i < _size; row += sizes[i++]) { for (int j = 0; j < _size; j++) for (int s = 0; s < sizes[i]; s++) { SignHash cell = getSigns(i, j); if (i == j) words[i] = cell.asSignSet().iterator().next().getOrthography(); if (cell.size() >= s + 1) { toprint[row + s][j] = ((Sign) cell.toArray()[s]) .getCategory().toString(); if (toprint[row + s][j].length() > maxwidth) maxwidth = toprint[row + s][j].length(); } } } int fullwidth = _size * (maxwidth + 3) - 1; System.out.print(" "); for (String w : words) { System.out.print(w); int pad = (maxwidth + 3) - w.length(); for (int p = 0; p < pad; p++) System.out.print(" "); } System.out.print("|"); System.out.println(); for (int p = 0; p < fullwidth; p++) System.out.print("-"); System.out.print("| "); System.out.println(); for (int i = 0, entry = sizes[0], e = 0; i < rows; i++) { if (i == entry) { System.out.print("|"); for (int p = 0; p < fullwidth; p++) System.out.print("-"); System.out.print("|"); System.out.println(); entry += sizes[++e]; } System.out.print("| "); for (int j = 0; j < _size; j++) { int pad = 1 + maxwidth; if (toprint[i][j] != null) { System.out.print(toprint[i][j]); pad -= toprint[i][j].length(); } for (int p = 0; p < pad; p++) System.out.print(" "); System.out.print("| "); } System.out.println(); } System.out.print("|"); for (int p = 0; p < fullwidth; p++) System.out.print("-"); System.out.print("| "); System.out.println(); } } ================================================ FILE: src/opennlp/ccg/parse/DerivationHistory.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-5 Jason Baldridge, Gann Bierner and // University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse; import opennlp.ccg.synsem.*; import opennlp.ccg.grammar.*; import java.io.Serializable; import java.util.*; /** * Record the steps taken in a derivation. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.12 $, $Date: 2009/12/16 22:39:32 $ */ public class DerivationHistory implements Serializable, Comparable { private static final long serialVersionUID = 2867339743258182859L; private Sign[] _inputs; private Sign _output; private Rule _rule; private boolean _noHistory = false; private transient int _complexity = -1; /** Constructor for a sign with no prior history. 
*/ public DerivationHistory(Sign output) { _noHistory = true; _output = output; } /** Constructor for a sign created by rule. */ public DerivationHistory(Sign[] inputs, Sign output, Rule rule) { _inputs = new Sign[inputs.length]; for (int i=0; i < inputs.length; i++) { _inputs[i] = inputs[i]; } _output = output; _rule = rule; } /** Returns true iff the history is empty. */ public boolean isEmpty() { return _noHistory; } /** Returns the inputs (or null if none). */ public Sign[] getInputs() { return _inputs; } /** Returns the output. */ public Sign getOutput() { return _output; } /** Returns the rule. */ public Rule getRule() { return _rule; } /** Returns the derivation history in vertical list form. */ public String toString() { return toString(maxRuleLen()); } // returns the derivation history given the max rule len, for alignment private String toString(int maxRuleLen) { StringBuffer sb = new StringBuffer(); // lex item if (_noHistory) { sb.append("(lex) "); for (int i = 5; i < maxRuleLen; i++) { sb.append(' '); } sb.append(_output.toString()).append('\n'); return sb.toString(); } // inputs for (int i=0; i < _inputs.length; i++) { sb.append(_inputs[i].getDerivationHistory().toString(maxRuleLen)); } // type-changing rule (possibly) String ruleName = _rule.name(); TypeChangingRule tcr = Grammar.theGrammar.rules.getTypeChangingRule(ruleName); if (tcr != null) { sb.append("(gram) "); for (int i = 6; i < maxRuleLen; i++) { sb.append(' '); } sb.append(tcr.toString()).append('\n'); } // this rule and result sb.append('(').append(ruleName).append(") "); for (int i = (ruleName.length() + 2); i < maxRuleLen; i++) { sb.append(' '); } sb.append(_output.toString()).append('\n'); // done return sb.toString(); } // returns the max length of rule names (including parens) private int maxRuleLen() { if (_noHistory) { return 6; } int max = 0; for (int i=0; i < _inputs.length; i++) { max = Math.max(max, _inputs[i].getDerivationHistory().maxRuleLen()); } max = Math.max(max, _rule.name().length() + 2); return max; } /** Returns the complexity of the derivation, as the sum of the number of steps, plus the number of composition or substitution steps, plus the number of crossing steps. */ public int complexity() { if (_complexity > 0) return _complexity; if (_noHistory) return 0; int retval = 1; String ruleName = _rule.name(); if (ruleName.length() > 1 && (ruleName.charAt(0) == '>' || ruleName.charAt(0) == '<')) { if (ruleName.charAt(1) == 'B' || ruleName.charAt(1) == 'S') { retval++; if (ruleName.length() == 3 && ruleName.charAt(2) == 'x') retval++; } } for (int i=0; i < _inputs.length; i++) { retval += _inputs[i].getDerivationHistory().complexity(); } _complexity = retval; return retval; } /** Returns whether the derivation contains a unary rule cycle. */ public boolean containsCycle() { if (_noHistory || _inputs.length != 1) return false; List rulesSeen = new ArrayList(4); rulesSeen.add(_rule); return _inputs[0].getDerivationHistory().containsCycle(rulesSeen); } // recursive cycle check private boolean containsCycle(List rulesSeen) { if (_noHistory || _inputs.length != 1) return false; if (rulesSeen.contains(_rule)) return true; rulesSeen.add(_rule); return _inputs[0].getDerivationHistory().containsCycle(rulesSeen); } /** Recursively compares derivation histories by their complexity. 
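 * Lower complexity sorts first. Under the weighting used by complexity(),
 * for example, a lexical leaf contributes 0, a plain application step such as
 * {@code >} or {@code <} contributes 1, a harmonic composition or substitution
 * step such as {@code >B} or {@code <S} contributes 2, and a crossed variant
 * such as {@code >Bx} contributes 3.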
*/ public int compareTo(DerivationHistory dh) { int c1 = complexity(); int c2 = dh.complexity(); if (c1 < c2) return -1; if (c1 > c2) return 1; if (_noHistory) return 0; if (_inputs.length < dh._inputs.length) return -1; if (_inputs.length > dh._inputs.length) return 1; for (int i=0; i < _inputs.length; i++) { int cmp = _inputs[i].getDerivationHistory().compareTo(dh._inputs[i].getDerivationHistory()); if (cmp != 0) return cmp; } return 0; } } ================================================ FILE: src/opennlp/ccg/parse/Edge.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2007 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse; import opennlp.ccg.synsem.*; import java.util.*; import java.io.Serializable; import java.text.*; /** *

    * An edge is a wrapper for a sign, ie a sign together * with a score, and optionally a list of alternative edges. * A representative edge is an edge that represents (stands in for) * other edges with the same category (but different LFs) during the * chart construction process, stored in the list of alternative edges; * it is considered disjunctive when there is more than one alternative. * Note that initially a representative edge will be in its list * of alternatives, but it can be removed during pruning. *
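     * <p>
     * For instance (an illustrative sketch only):
     * <pre>{@code
     * Edge rep = new Edge(sign);   // wrap a sign; the score defaults to 0.0
     * rep.initAltEdges();          // rep becomes a representative containing itself
     * rep.isRepresentative();      // true
     * rep.isDisjunctive();         // false until a second alternative is added
     * }</pre>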

    * * @author Michael White * @version $Revision: 1.4 $, $Date: 2009/12/22 22:19:00 $ */ public class Edge implements Serializable { private static final long serialVersionUID = 1L; /** Class for storing back-refs from signs. */ public static class EdgeRef implements Serializable { private static final long serialVersionUID = 1L; /** The edge. */ public final Edge edge; /** Constructor. */ public EdgeRef(Edge edge) { this.edge = edge; } } /** Returns the edge associated with this sign, or null if none. */ public static Edge getEdge(Sign sign) { EdgeRef eref = (EdgeRef) sign.getData(EdgeRef.class); return (eref != null) ? eref.edge : null; } /** The sign. */ protected Sign sign; /** The edge score. */ protected double score; /** Word position, for lexical edges (otherwise -1). */ protected int wordPos = -1; /** The alternative edges (none initially). */ protected List altEdges = null; /** Saved list of alternative edges, for restoring chart after unpacking. */ protected transient List savedAltEdges = null; /** Constructor (score defaults to 0.0). */ public Edge(Sign sign) { this(sign, 0.0); } /** Constructor with score. */ public Edge(Sign sign, double score) { this.sign = sign; this.score = score; sign.addData(new EdgeRef(this)); } /** Returns the sign. */ public Sign getSign() { return sign; } /** Returns the score. */ public double getScore() { return score; } /** Sets the score. */ public void setScore(double score) { this.score = score; } /** Returns the word position of a lexical edge (otherwise -1). */ public int getWordPos() { return wordPos; } /** Sets the word position of a lexical edge. */ public void setWordPos(int pos) { wordPos = pos; } /** Returns whether this edge is a representative. */ public boolean isRepresentative() { return altEdges != null; } /** Returns whether this edge is disjunctive. */ public boolean isDisjunctive() { return altEdges != null && altEdges.size() > 1; } /** Returns the list of alt edges, or the empty list if none. */ public List getAltEdges() { if (altEdges == null) return Collections.emptyList(); else return altEdges; } /** Initializes the alt edges list with a default capacity, adding this edge. */ public void initAltEdges() { initAltEdges(3); } /** Initializes the alt edges list with the given capacity, adding this edge. */ public void initAltEdges(int capacity) { // check uninitialized if (altEdges != null) throw new RuntimeException("Alt edges already initialized!"); altEdges = new ArrayList(capacity); altEdges.add(this); } /** Replaces the alt edges, saving the current ones for later restoration. */ public void replaceAltEdges(List newAlts) { savedAltEdges = altEdges; altEdges = newAlts; } /** Recursively restores saved alt edges, if any. */ public void restoreAltEdges() { if (savedAltEdges != null) { // restore altEdges = savedAltEdges; savedAltEdges = null; // recurse for (Edge alt : altEdges) { Sign[] inputs = alt.sign.getDerivationHistory().getInputs(); if (inputs != null) { for (Sign s : inputs) getEdge(s).restoreAltEdges(); } } } } /** Returns a hash code for this edge, based on its sign. (Alternatives and the score are not considered.) */ public int hashCode() { return sign.hashCode() * 23; } /** Returns a hash code for this edge based on the sign's surface words. (Alternatives and the score are not considered.) */ public int surfaceWordHashCode() { return sign.surfaceWordHashCode() * 23; } /** Returns whether this edge equals the given object. (Alternatives and the score are not considered.) 
*/ public boolean equals(Object obj) { if (obj == this) return true; if (!(obj instanceof Edge)) return false; Edge edge = (Edge) obj; return sign.equals(edge.sign); } /** Returns whether this edge equals the given object based on the sign's surface words. (Alternatives and the score are not considered.) */ public boolean surfaceWordEquals(Object obj) { if (obj == this) return true; if (!(obj instanceof Edge)) return false; Edge edge = (Edge) obj; return sign.surfaceWordEquals(edge.sign); } /** * Returns a string for the edge in the format * [score] orthography :- category. */ public String toString() { StringBuffer sbuf = new StringBuffer(); if (score >= 0.001 || score == 0.0) sbuf.append("[" + nf3.format(score) + "] "); else sbuf.append("[" + nfE.format(score) + "] "); sbuf.append(sign.toString()); return sbuf.toString(); } // formats to three decimal places private static final NumberFormat nf3 = initNF3(); private static NumberFormat initNF3() { NumberFormat f = NumberFormat.getInstance(); f.setMinimumIntegerDigits(1); f.setMinimumFractionDigits(3); f.setMaximumFractionDigits(3); return f; } // formats to "0.##E0" private static final NumberFormat nfE = new DecimalFormat("0.##E0"); } ================================================ FILE: src/opennlp/ccg/parse/EdgeHash.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-7 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse; import gnu.trove.*; import java.util.*; /** * A set of edges, unique up to surface words. * Edges whose signs have lower derivational complexity are kept during insertion. * NB: This is just like EdgeHash in the realize package, except that * it deals with parse edges. * * @author Michael White * @version $Revision: 1.1 $, $Date: 2007/12/20 05:51:10 $ */ public class EdgeHash extends THashSet { private static final long serialVersionUID = 1L; /** Hashing strategy that uses Edge's surfaceWordHashCode and surfaceWordEquals methods. */ protected static TObjectHashingStrategy surfaceWordHashingStrategy = new TObjectHashingStrategy() { private static final long serialVersionUID = 1L; public int computeHashCode(java.lang.Object o) { return ((Edge)o).surfaceWordHashCode(); } public boolean equals(java.lang.Object o1, java.lang.Object o2) { return ((Edge)o1).surfaceWordEquals((Edge)o2); } }; /** Default constructor. */ public EdgeHash() { super(surfaceWordHashingStrategy); } /** * Returns this as a set of edges. 
*/ @SuppressWarnings("unchecked") public Set asEdgeSet() { return (Set) this; } /** * Adds an edge, keeping the one whose sign has lower derivational complexity * if there is an equivalent one there already; returns the old * edge if it was displaced, the new edge if there was no equivalent * old edge, or null if the edge was not actually added. * iff the edge is actually inserted. */ public Edge insert(Edge edge) { int pos = index(edge); if (pos >= 0) { Edge oldEdge = (Edge) _set[pos]; if (oldEdge == edge) return null; int complexity = edge.sign.getDerivationHistory().complexity(); int oldComplexity = oldEdge.sign.getDerivationHistory().complexity(); if (complexity < oldComplexity) { _set[pos] = edge; return oldEdge; } else return null; } else { add(edge); return edge; } } } ================================================ FILE: src/opennlp/ccg/parse/ParseException.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-9 Jason Baldridge, Gann Bierner and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse; /** * Any exception having to do with reading the lexicon or rules, etc. * * @author Gann Bierner * @version $Revision: 1.3 $, $Date: 2009/12/20 18:54:41 $ */ public class ParseException extends Exception { private static final long serialVersionUID = 1L; /** Time limit exceeded message. */ public static final String TIME_LIMIT_EXCEEDED = "Time limit exceeded"; /** Edge limit exceeded message. */ public static final String EDGE_LIMIT_EXCEEDED = "Edge limit exceeded"; /** * Class constructor * * @param s * the error message */ public ParseException(String s) { super(s); } public String toString() { return getMessage(); } } ================================================ FILE: src/opennlp/ccg/parse/Parser.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-9 Jason Baldridge, Gann Bierner and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. 
// // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse; import opennlp.ccg.TextCCG; import opennlp.ccg.lexicon.*; import opennlp.ccg.synsem.*; import opennlp.ccg.grammar.*; import opennlp.ccg.hylo.EPsScorer; import opennlp.ccg.hylo.HyloHelper; import opennlp.ccg.hylo.Nominal; import opennlp.ccg.unify.*; import opennlp.ccg.util.Pair; import java.util.*; import java.util.prefs.Preferences; /** * The parser is a CKY chart parser for CCG, optionally * with iterative beta-best supertagging and n-best output. * * @author Jason Baldridge * @author Gann Bierner * @author Michael White * @version $Revision: 1.38 $, $Date: 2011/08/27 19:27:00 $ */ public class Parser { /** Preference key for time limit on parsing. */ public static final String PARSE_TIME_LIMIT = "Parse Time Limit"; /** A constant indicating no time limit on parsing. */ public static final int NO_TIME_LIMIT = 0; /** Preference key for edge limit on parsing. */ public static final String PARSE_EDGE_LIMIT = "Parse Edge Limit"; /** A constant indicating no edge limit on parsing. */ public static final int NO_EDGE_LIMIT = 0; /** Preference key for pruning the number of signs kept per equivalence class. */ public static final String PARSE_PRUNING_VALUE = "Parse Pruning Value"; /** Preference key for pruning the number of edges kept per cell. */ public static final String PARSE_CELL_PRUNING_VALUE = "Parse Cell Pruning Value"; /** A constant indicating no pruning of signs per equivalence class. */ public static final int NO_PRUNING = 0; /** Preference key for whether to use lazy unpacking. */ public static final String PARSE_LAZY_UNPACKING = "Parse Lazy Unpacking"; /** The grammar. */ public final Grammar grammar; /** The lexicon used to create edges. */ public final Lexicon lexicon; /** The rules used to create edges. */ public final RuleGroup rules; /** Flag for whether to show the chart for failed parses. */ public boolean debugParse = false; /** The sign scorer (or null if none). */ protected SignScorer signScorer = null; /** The "n" for n-best pruning. (Default is none.) */ protected int pruneVal = -1; /** The cell pruning value. (Default is none.) */ protected int cellPruneVal = -1; /** The lazy unpacking flag. (Default is none.) */ protected Boolean lazyUnpacking = null; /** Supertagger to use. (Default is none.) */ protected Supertagger supertagger = null; /** Flag for whether to use the supertagger in the most-to-least restrictive direction. */ protected boolean stMostToLeastDir = true; /** Time limit in milliseconds. (Default is none.) */ protected int timeLimit = -1; /** Edge limit. (Default is none.) 
*/ protected int edgeLimit = -1; // start time for chart construction private long startTime = 0; // lex lookup time private int lexTime = 0; // parse time private int parseTime = 0; // chart construction time private int chartTime = 0; // unpacking time private int unpackingTime = 0; // time limit to use private int timeLimitToUse = NO_TIME_LIMIT; // edge limit to use private int edgeLimitToUse = NO_EDGE_LIMIT; // pruning value to use private int pruneValToUse = NO_PRUNING; // pruning value to use private int cellPruneValToUse = NO_PRUNING; // lazy unpacking flag to use private boolean lazyUnpackingToUse = true; // current chart private Chart chart = null; // parse results private ArrayList result; // parse scores private ArrayList scores; // flag for whether to glue fragments currently private boolean gluingFragments = false; /** Constructor. */ public Parser(Grammar grammar) { this.grammar = grammar; this.lexicon = grammar.lexicon; this.rules = grammar.rules; } /** Sets the sign scorer. */ public void setSignScorer(SignScorer signScorer) { this.signScorer = signScorer; } /** Sets the time limit. */ public void setTimeLimit(int timeLimit) { this.timeLimit = timeLimit; } /** Sets the edge limit. */ public void setEdgeLimit(int edgeLimit) { this.edgeLimit = edgeLimit; } /** Sets the n-best pruning val. */ public void setPruneVal(int n) { pruneVal = n; } /** Sets the cell pruning val. */ public void setCellPruneVal(int n) { cellPruneVal = n; } /** Sets the lazy unpacking flag. */ public void setLazyUnpacking(Boolean b) { this.lazyUnpacking = b; } /** Sets the supertagger. */ public void setSupertagger(Supertagger supertagger) { this.supertagger = supertagger; } /** Sets the supertagger most-to-least restrictive direction flag. */ public void setSupertaggerMostToLeastRestrictiveDirection(boolean bool) { stMostToLeastDir = bool; } /** * Parses a string. * * @param s the string * @exception ParseException thrown if a parse can't be found for the * entire string */ public void parse(String s) throws ParseException { // tokenize List words = lexicon.tokenizer.tokenize(s); // parse words parse(words); } /** * Parses a list of words. 
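 * Results can subsequently be retrieved via getResult and getScores.
 * A minimal usage sketch (illustrative only, assuming a loaded grammar):
 * <pre>{@code
 * Parser parser = new Parser(grammar);
 * parser.setPruneVal(10);                  // keep a 10-best list
 * parser.parse("he saw the man with the telescope");
 * List<Sign> parses = parser.getResult();
 * List<Double> scores = parser.getScores();
 * }</pre>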
*/ public void parse(List words) throws ParseException { // set up timing: use limit from prefs unless explicitly set Preferences prefs = Preferences.userNodeForPackage(TextCCG.class); if (timeLimit >= 0) timeLimitToUse = timeLimit; else timeLimitToUse = prefs.getInt(PARSE_TIME_LIMIT, NO_TIME_LIMIT); if (edgeLimit >= 0) edgeLimitToUse = edgeLimit; else edgeLimitToUse = prefs.getInt(PARSE_EDGE_LIMIT, NO_EDGE_LIMIT); if (pruneVal >= 0) pruneValToUse = pruneVal; else pruneValToUse = prefs.getInt(PARSE_PRUNING_VALUE, NO_PRUNING); if (cellPruneVal >= 0) cellPruneValToUse = cellPruneVal; else cellPruneValToUse = prefs.getInt(PARSE_CELL_PRUNING_VALUE, NO_PRUNING); if (lazyUnpacking != null) lazyUnpackingToUse = lazyUnpacking; else lazyUnpackingToUse = prefs.getBoolean(PARSE_LAZY_UNPACKING, true); // supertagger case: iterative beta-best if (supertagger != null) { parseWithSupertagger(words); return; } // otherwise just once try { // init long lexStartTime = System.currentTimeMillis(); UnifyControl.startUnifySequence(); // get entries for each word List entries = new ArrayList(words.size()); for (Word w : words) { entries.add(lexicon.getSignsFromWord(w)); } lexTime = (int) (System.currentTimeMillis() - lexStartTime); // do parsing parseEntries(entries); } catch (LexException e) { setGiveUpTime(); String msg = "Unable to retrieve lexical entries:\n\t" + e.toString(); if (debugParse) System.out.println(msg); throw new ParseException(msg); } catch (ParseException e) { setGiveUpTime(); // show chart for failed parse if apropos if (debugParse) { System.out.println(e); System.out.println("Chart for failed parse:"); chart.printChart(); } // rethrow throw e; } } // iterative beta-best parsing private void parseWithSupertagger(List words) throws ParseException { // set supertagger in lexicon grammar.lexicon.setSupertagger(supertagger); // ensure gluing off gluingFragments = false; // reset beta if (stMostToLeastDir) supertagger.resetBeta(); else supertagger.resetBetaToMax(); // loop boolean done = false; while (!done) { try { // init long lexStartTime = System.currentTimeMillis(); UnifyControl.startUnifySequence(); // get filtered entries for each word List entries = new ArrayList(words.size()); supertagger.mapWords(words); for (int i=0; i < words.size(); i++) { supertagger.setWord(i); Word word = words.get(i); entries.add(lexicon.getSignsFromWord(word)); } lexTime = (int) (System.currentTimeMillis() - lexStartTime); // do parsing parseEntries(entries); // done done = true; // reset supertagger in lexicon, turn gluing off grammar.lexicon.setSupertagger(null); gluingFragments = false; } catch (LexException e) { // continue if more betas if (stMostToLeastDir && supertagger.hasMoreBetas()) { supertagger.nextBeta(); } // otherwise give up else { setGiveUpTime(); // reset supertagger in lexicon, turn gluing off grammar.lexicon.setSupertagger(null); gluingFragments = false; // throw parse exception String msg = "Unable to retrieve lexical entries:\n\t" + e.toString(); if (debugParse) System.out.println(msg); throw new ParseException(msg); } } catch (ParseException e) { // check if limits exceeded boolean outwith = e.getMessage() == ParseException.EDGE_LIMIT_EXCEEDED || e.getMessage() == ParseException.TIME_LIMIT_EXCEEDED; // continue if more betas and limits not exceeded if (stMostToLeastDir && supertagger.hasMoreBetas() && !outwith) supertagger.nextBeta(); // or if limits exceeded and moving in the opposite direction else if (!stMostToLeastDir && supertagger.hasLessBetas() && outwith) 
supertagger.previousBeta(); // otherwise try glue rule, unless already on else if (!gluingFragments) { supertagger.resetBeta(); // may as well use most restrictive supertagger setting with glue rule gluingFragments = true; } // otherwise give up else { setGiveUpTime(); // show chart for failed parse if apropos if (debugParse) { System.out.println(e); System.out.println("Chart for failed parse:"); chart.printChart(); } // reset supertagger in lexicon, turn gluing off grammar.lexicon.setSupertagger(null); gluingFragments = false; // rethrow throw e; } } } }
/** * Returns the results of the parse. */ public List getResult() { return result; }
/** * Returns the corresponding scores for the results of the parse. */ public List getScores() { return scores; }
/** Returns the edge count prior to unpacking. */ public int edgeCount() { return (chart != null) ? chart.edgeCount() : 0; }
/** Returns the edge count while unpacking. */ public int unpackingEdgeCount() { return (chart != null) ? chart.unpackingEdgeCount() : 0; }
/** Returns the max cell size prior to unpacking. */ public int maxCellSize() { return (chart != null) ? chart.maxCellSize() : 0; }
/** Returns the lexical lookup time for the latest parse. */ public int getLexTime() { return lexTime; }
/** Returns the overall parse time (but excluding lex lookup) for the latest parse. */ public int getParseTime() { return parseTime; }
/** Returns the time spent constructing the chart. */ public int getChartTime() { return chartTime; }
/** Returns the time spent unpacking. */ public int getUnpackingTime() { return unpackingTime; }
/** Returns the supertagger's final beta value (or 0 if none). */ public double getSupertaggerBeta() { return (supertagger != null) ? supertagger.getCurrentBetaValue() : 0; }
// parses from lex entries
private void parseEntries(List entries) throws ParseException { startTime = System.currentTimeMillis(); // set up chart initializeChart(entries); if (signScorer != null) chart.setSignScorer(signScorer); chart.setPruneVal(pruneValToUse); chart.setTimeLimit(timeLimitToUse); chart.setStartTime(startTime); chart.setEdgeLimit(edgeLimitToUse); chart.setCellLimit(cellPruneValToUse); // do parsing parse(entries.size()); }
// initialize the chart
private void initializeChart(List entries) { chart = new Chart(entries.size(), rules); for (int i=0; i < entries.size(); i++) { SignHash wh = entries.get(i); for (Sign sign : wh.getSignsSorted()) { Category cat = sign.getCategory(); UnifyControl.reindex(cat); chart.insert(i, i, sign); } } }
// actual CKY parsing
private void parse(int size) throws ParseException {
    // fill in chart: lexical cells first, then combine spans bottom-up
    for (int i=0; i < size; i++) {
        chart.insertCell(i, i);
    }
    for (int j=1; j < size; j++) {
        for (int i=j-1; i >= 0; i--) {
            for (int k=i; k < j; k++) {
                chart.insertCell(i, k, k+1, j, i, j);
            }
            chart.insertCell(i, j);
        }
    }
    // glue fragments if apropos
    if (gluingFragments && chart.cellIsEmpty(0, size-1)) {
        for (int j=1; j < size; j++) {
            for (int i=j-1; i >= 0; i--) {
                for (int k=i; k < j; k++) {
                    chart.insertCellFrag(i, k, k+1, j, i, j);
                }
            }
        }
    }
    chartTime = (int) (System.currentTimeMillis() - startTime);
    // unpack results from the top cell
    createResult(size);
    parseTime = (int) (System.currentTimeMillis() - startTime);
    unpackingTime = parseTime - chartTime;
}
// creates the result and score lists by unpacking the top cell
private void createResult(int size) throws ParseException {
    result = new ArrayList<Sign>();
    scores = new ArrayList<Double>();
    // unpack top
    List unpacked = (lazyUnpackingToUse) ? chart.lazyUnpack(0,size - 1) : chart.unpack(0, size - 1);
    // add signs for unpacked edges
    for (Edge edge : unpacked) { result.add(edge.sign); scores.add(edge.score); }
    // check non-empty
    if (result.size() == 0) { throw new ParseException("Unable to parse"); }
}
// set parse time when giving up
private void setGiveUpTime() { chartTime = (int) (System.currentTimeMillis() - startTime); parseTime = chartTime; unpackingTime = 0; }
/** * Adds the supertagger log probs to the lexical signs of the gold standard parse.
*/ public void addSupertaggerLogProbs(Sign gold) { List words = gold.getWords(); supertagger.mapWords(words); addSupertaggerLogProbs(gold, gold); for (int i=0; i < words.size(); i++) { supertagger.setWord(i); } } // recurses through derivation, adding lex log probs to lexical signs private void addSupertaggerLogProbs(Sign gold, Sign current) { // lookup and add log prob for lex sign if (current.isLexical()) { supertagger.setWord(gold.wordIndex(current)); Map stags = supertagger.getSupertags(); Double lexprob = stags.get(current.getSupertag()); if (lexprob != null) { current.addData(new SupertaggerAdapter.LexLogProb((float) Math.log10(lexprob))); } } // otherwise recurse else { Sign[] inputs = current.getDerivationHistory().getInputs(); for (Sign s : inputs) addSupertaggerLogProbs(gold, s); } } /** * Returns the oracle best sign among those in the n-best list for the given LF, * using the f-score on all EPs, together with a flag indicating whether the gold LF * was found (as indicated by an f-score of 1.0). * NB: It would be better to return the forest oracle, but the nominal conversion would * be tricky to do correctly. */ public Pair oracleBest(LF goldLF) { Sign retval = null; double bestF = 0.0; for (Sign sign : result) { Category cat = sign.getCategory().copy(); Nominal index = cat.getIndexNominal(); LF parsedLF = cat.getLF(); if (parsedLF != null) { index = HyloHelper.convertNominals(parsedLF, sign, index); EPsScorer.Results score = EPsScorer.score(parsedLF, goldLF); if (score.fscore > bestF) { retval = sign; bestF = score.fscore; } } } return new Pair(retval, (bestF == 1.0)); } } ================================================ FILE: src/opennlp/ccg/parse/Supertagger.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse; import opennlp.ccg.lexicon.*; import java.util.*; /** * A parsing supertagger must extend the SupertaggerAdapter interface for plugging a * supertagger into the lexicon. It must additionally support methods for * calculating and caching contextual supertagging assignments, so that * supertags can be retrieved just based on the current word index. * * @author Michael White * @version $Revision: 1.3 $, $Date: 2010/12/08 15:24:26 $ */ public interface Supertagger extends SupertaggerAdapter { /** * Maps the given words to their predicted categories, * so that the beta-best categories can be returned by calls to setWord * and getSupertags. */ public void mapWords(List words); /** * Sets the current word to the one with the given index, * so that the beta-best categories for it can be returned by a call to * getSupertags. 
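 * A typical calling sequence looks roughly as follows (schematic only; how
 * the returned supertags are used to filter lexical entries is up to the
 * caller):
 * <pre>{@code
 * supertagger.mapWords(words);
 * for (int i = 0; i < words.size(); i++) {
 *     supertagger.setWord(i);
 *     Map<String,Double> stags = supertagger.getSupertags();
 *     // keep only lexical categories whose supertags appear in stags
 * }
 * }</pre>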
*/ public void setWord(int index); } ================================================ FILE: src/opennlp/ccg/parse/postagger/BasicPOSTagger.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (c) 2010 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed inp the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.postagger; import opennlp.ccg.parse.postagger.ml.POSPriorModel; import java.io.BufferedReader; import java.io.BufferedWriter; import java.io.File; import java.io.FileNotFoundException; import java.io.FileReader; import java.io.FileWriter; import java.io.IOException; import java.io.InputStreamReader; import java.io.OutputStreamWriter; import java.util.ArrayList; import java.util.Collection; import java.util.Collections; import java.util.Comparator; import java.util.HashMap; import java.util.List; import java.util.Map; import java.util.logging.Level; import java.util.logging.Logger; import opennlp.ccg.lexicon.Word; import opennlp.ccg.parse.tagger.TaggedWord; import opennlp.ccg.parse.tagger.ml.MaxentModel; import opennlp.ccg.parse.supertagger.ml.FeatureExtractor; import opennlp.ccg.util.Pair; import opennlp.ccg.parse.tagger.io.SRILMFactoredBundleCorpusIterator; import opennlp.ccg.parse.tagger.util.ResultSink; import opennlp.ccg.parse.tagger.sequencescoring.SequenceScorer; import opennlp.ccg.parse.tagger.Constants; /** * A non-dummy POS tagger. * * @author Dennis N. Mehay */ public class BasicPOSTagger extends POSTagger { private FeatureExtractor posFex = null; private MaxentModel tagMod = null; private static final Comparator> comp = new Comparator>() { public int compare(Pair pr0, Pair pr1) { // sorts descending by prob (the double member of the pair). if(pr0.a == pr1.a) { return 0; } else if (pr0.a < pr1.a) { return 1; } else { return -1; } } }; public BasicPOSTagger(MaxentModel tagMod, FeatureExtractor posFex, String tagSequenceModel) { this.posFex = posFex; this.tagMod = tagMod; int ord = SequenceScorer.findOrder(tagSequenceModel); try { posSeqMod = new SequenceScorer(ord, tagSequenceModel); // set the search algorithm. posSeqMod.setAlgorithm(Constants.TaggingAlgorithm.FORWARDBACKWARD); // set the search beam width posSeqMod.setSearchBeam(5); } catch (IOException ex) { Logger.getLogger(BasicPOSTagger.class.getName()).log(Level.SEVERE, null, ex); } } public List tagSentence(List sentence) { List result = new ArrayList(sentence.size()); // the prob-string taggings (to be filtered, etc. before adding them to the taggings of the TaggedWord list). 
List>> taggings = new ArrayList>>(sentence.size()); Map sentMap = new HashMap(sentence.size()); int ind = 0; for(Word w : sentence) { sentMap.put(ind++, new TaggedWord(w)); } List>> ftss = posFex.getSentenceFeatures(sentMap); double[] distro = null; int wordIndex = 0; for(Collection> fts : ftss) { distro = tagMod.eval(fts); List> distroList = new ArrayList>(distro.length); ind = 0; for(double prob : distro) { distroList.add(new Pair(prob, ind++)); } Collections.sort(distroList, comp); // widen beta a little bit (we're going to do some fwd-bwd rescoring inp a minute, but we don't // want to do the fwd-bwd alg over ALL possible tags -- too inefficient). List> tagging = new ArrayList>(distro.length); double best = distroList.get(0).a; double widenedBeta = beta/8; String goldPOS = sentence.get(wordIndex).getPOS(); for(Pair outcome : distroList) { if( (outcome.a >= (widenedBeta * best)) || (includeGold && tagMod.getOutcome(outcome.b).equals(goldPOS)) ) { tagging.add(new Pair(outcome.a, tagMod.getOutcome(outcome.b))); } else { if(!includeGold) { // if not still potentially fishing for a gold POS tag, then break (they're in sorted order). break; } } } taggings.add(tagging); wordIndex++; } // rescore using forward-backward. taggings = posSeqMod.rescoreSequence(taggings); // add these rescored taggings to the list of TaggedWord's. int wInd = 0; for(List> tagging : taggings) { TaggedWord tmpWd = new TaggedWord(sentence.get(wInd++)); tmpWd.setPOSTagging(tagging); result.add(tmpWd); } // now filter down to the beta-best. return betaBestFilter(result); } public static void main(String[] args) throws IOException { String usage = "\nBasicPOSTagger -c (-i [defaults to ]) (-o [defaults to ])\n"+ " (-e [test tagger; assumes input is gold-standard corpus])\n"; if (args.length > 0 && args[0].equals("-h")) { System.out.println(usage); System.exit(0); } SRILMFactoredBundleCorpusIterator inp = null; BufferedWriter out = null; try { String inputCorp = "", output = "", configFile = null; boolean test = false; for (int i = 0; i < args.length; i++) { if (args[i].equals("-i")) { inputCorp = args[++i]; continue; } if (args[i].equals("-o")) { output = args[++i]; continue; } if (args[i].equals("-e")) { test = true; continue; } if (args[i].equals("-c")) { configFile = args[++i]; continue; } System.out.println("Unrecognized option: " + args[i]); } ResultSink rs = new ResultSink(ResultSink.ResultSinkType.POSTAG); try { inp = new SRILMFactoredBundleCorpusIterator( (inputCorp.equals("")) ? new BufferedReader(new InputStreamReader(System.in)) : new BufferedReader(new FileReader(new File(inputCorp)))); } catch (FileNotFoundException ex) { System.err.print("Input corpus " + inputCorp + " not found. Exiting..."); Logger.getLogger(POSPriorModel.class.getName()).log(Level.SEVERE, null, ex); System.exit(-1); } try { out = (output.equals("")) ? new BufferedWriter(new OutputStreamWriter(System.out)) : new BufferedWriter(new FileWriter(new File(output))); } catch (IOException ex) { System.err.print("Output file " + output + " not found. 
Exiting..."); Logger.getLogger(POSPriorModel.class.getName()).log(Level.SEVERE, null, ex); System.exit(-1); } POSTagger post = POSTagger.posTaggerFactory(configFile); for (List inLine : inp) { List taggedSent = post.tagSentence(inLine); List>> sentTagging = new ArrayList>>(taggedSent.size()); for(TaggedWord tw : taggedSent) { sentTagging.add(tw.getPOSTagging()); } if(test) { rs.addSent(sentTagging, inLine); } out.write("" + System.getProperty("line.separator")); for(TaggedWord tw : taggedSent) { out.write(tw.getForm()); for(Pair tg : tw.getPOSTagging()) { out.write("\t" + tg.b + "\t" + tg.a); } out.write(System.getProperty("line.separator")); } out.write("" + System.getProperty("line.separator")); } out.flush(); if(test) { System.err.println(rs.report()); } } catch(Throwable t) { t.printStackTrace(); } finally { try { inp.close(); out.close(); } catch (IOException ex) { Logger.getLogger(POSPriorModel.class.getName()).log(Level.SEVERE, null, ex); } } } } ================================================ FILE: src/opennlp/ccg/parse/postagger/DummyPOSTagger.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2010 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.postagger; import java.util.ArrayList; import java.util.List; import opennlp.ccg.lexicon.Word; import opennlp.ccg.parse.tagger.TaggedWord; import opennlp.ccg.util.Pair; /** * A "DummyPOSTagger" simply grabs the single POS tag in the Words themselves * and puts them into a TaggedWord with a singleton list of probability 1.0 POS * tags. * * @author Dennis N. Mehay */ public class DummyPOSTagger extends POSTagger { public List tagSentence(List sentence) { List result = new ArrayList(sentence.size()); for(Word w : sentence) { List> tmpTagging = new ArrayList>(1); tmpTagging.add(new Pair(1.0,w.getPOS())); TaggedWord tmp = new TaggedWord(w); tmp.setPOSTagging(tmpTagging); result.add(tmp); } return result; } } ================================================ FILE: src/opennlp/ccg/parse/postagger/POSTagSequenceGetter.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (c) 2010 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed inp the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. 
See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.postagger; import java.io.BufferedReader; import java.io.BufferedWriter; import java.io.File; import java.io.FileNotFoundException; import java.io.FileReader; import java.io.FileWriter; import java.io.IOException; import java.util.List; import opennlp.ccg.lexicon.Word; import opennlp.ccg.parse.tagger.io.SRILMFactoredBundleCorpusIterator; /** * @author Dennis N. Mehay */ public class POSTagSequenceGetter { public static void main(String[] args) throws FileNotFoundException, IOException { String usage = "\nPOSTagSequenceGetter -i -o \n"; String input = null, output = null; if(args == null || args.length == 0 || args[0].equals("-h")) { System.err.println(usage); System.exit(0); } for(int i = 0; i < args.length; i++) { if(args[i].equals("-i")) { input = args[++i]; continue; } if(args[i].equals("-o")) { output = args[++i]; continue; } System.err.println("unknown command-line option: " + args[i]); } BufferedReader in = new BufferedReader(new FileReader(new File(input))); SRILMFactoredBundleCorpusIterator corp = new SRILMFactoredBundleCorpusIterator(in); BufferedWriter out = new BufferedWriter(new FileWriter(new File(output))); for(List sent : corp) { out.write(" "); for(Word w : sent) { out.write(w.getPOS()+" "); } out.write(""+System.getProperty("line.separator")); } out.close(); } } ================================================ FILE: src/opennlp/ccg/parse/postagger/POSTagger.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2010 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.postagger; import opennlp.ccg.parse.tagger.Constants.TaggingAlgorithm; import java.io.File; import java.io.FileNotFoundException; import java.io.IOException; import java.util.ArrayList; import java.util.List; import java.util.Map; import java.util.logging.Level; import java.util.logging.Logger; import opennlp.ccg.parse.tagger.TaggedWord; import opennlp.ccg.lexicon.Word; import opennlp.ccg.parse.postagger.ml.POSPriorModel; import opennlp.ccg.parse.postagger.ml.POSTagFex; import opennlp.ccg.parse.tagger.ml.MaxentModel; import opennlp.ccg.parse.tagger.ml.ZLMEM; import opennlp.ccg.parse.tagger.sequencescoring.SequenceScorer; import opennlp.ccg.util.Pair; import opennlp.ccg.parse.tagger.util.ConfigFileProcessor; /** * Interface for POS taggers. 
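* Concrete implementations in this package are {@code BasicPOSTagger} and {@code DummyPOSTagger};
* instances are normally obtained via the {@code posTaggerFactory(String)} method below.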
* * @author Dennis N. Mehay */ public abstract class POSTagger { protected SequenceScorer posSeqMod = null; public TaggingAlgorithm alg = TaggingAlgorithm.FORWARDBACKWARD; public double beta = 1.0; protected boolean includeGold = false; /** In goes a list of {@code Word}s; out comes a list of {@code TaggedWord}s*/ public abstract List tagSentence(List sentence); /** Set the tagging algorithm. */ public void setTaggingAlgorithm(TaggingAlgorithm newAlg) { alg = newAlg; posSeqMod.setAlgorithm(alg); } /** Set the beam width (by default, it's 1.0 -- i.e., single-best). */ public void setBeta(double beta) { this.beta = beta; } /** Say whether or not we will include gold tags (e.g., for training). */ public void setIncludeGold(boolean includeGoldOrNot) { includeGold = includeGoldOrNot; } /** * Filter the POS tags by the beta filter and return the (potentially) trimmed-down results. * It is assumed that the tags of the tagged word are sorted in descending order of * probability. */ public List betaBestFilter(List sentence) { List res = new ArrayList(sentence.size()); for (TaggedWord tw : sentence) { Word w = tw.getWord(); double best = tw.getPOSTagging().get(0).a; int endIndex = 0; for (Pair tagging : tw.getPOSTagging()) { if (tagging.a >= (beta * best)) { endIndex++; } else { break; } } List> tmpTagging = new ArrayList>(tw.getPOSTagging().size()); for (Pair tg : tw.getPOSTagging()) { tmpTagging.add(tg); } tmpTagging.subList(endIndex, tmpTagging.size()).clear(); TaggedWord twTmp = new TaggedWord(w); twTmp.setPOSTagging(tmpTagging); res.add(twTmp); } return res; } /** * Build a POS tagger from a config file. * A non-dummy config file might contain: * ... * # this is a comment * taggerType=basic * priorModel=/home/.../posprior/prior.flm * # note that CaSE dOES Not matter for the key (but does for the value, e.g. a file name). * PRIORmodelvocab=/home/.../posprior/vocab.voc * # you can also repeat opions. the last one will take effect. * priormodelvocab=/home/.../posprior/vocab2.voc * * # did you see that empty line get ignored? * # notice that spaces around the '=' get ignored, as well. * maxentModel = /home/.../maxentmodels/myposmod.mod * # this last must be an ARPA-formatted n-gram model over POS tags (7-grams work well). * sequenceModel=/home/.../pos.lm * # lastly, the tagging beam width (1.0 means "single-best" -- i.e., a unitagger). * beta=0.1 */ public static POSTagger posTaggerFactory(String configFile) { POSTagger res = null; try { String[] pathKeys = { "maxentmodel", "priormodel", "priormodelvocab", "sequencemodel"}; Map opts = ConfigFileProcessor.readInConfig(configFile, pathKeys); if (opts.get("taggertype").equalsIgnoreCase("dummy")) { return new DummyPOSTagger(); } MaxentModel mem = new ZLMEM(new File(opts.get("maxentmodel"))); POSPriorModel posPrior = null; if (opts.get("priormodel") != null) { posPrior = new POSPriorModel(opts.get("priormodel"), opts.get("priormodelvocab")); } POSTagFex fexer = new POSTagFex(posPrior); res = new BasicPOSTagger(mem, fexer, opts.get("sequencemodel")); res.setBeta(Double.parseDouble(opts.get("beta"))); TaggingAlgorithm alg = (opts.get("taggingalgorithm") == null || opts.get("taggingalgorithm").equals("forward-backward")) ? TaggingAlgorithm.FORWARDBACKWARD : TaggingAlgorithm.FORWARD; res.setTaggingAlgorithm(alg); res.setIncludeGold((opts.get("includegold") == null || opts.get("includegold").equals("false")) ? 
false : true); } catch (FileNotFoundException ex) { Logger.getLogger(POSTagger.class.getName()).log(Level.SEVERE, null, ex); } catch (IOException ex) { Logger.getLogger(POSTagger.class.getName()).log(Level.SEVERE, null, ex); } return res; } } ================================================ FILE: src/opennlp/ccg/parse/postagger/ml/POSPriorModel.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2010 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.postagger.ml; import opennlp.ccg.parse.supertagger.util.ProbPairComparator; import java.io.BufferedReader; import java.io.BufferedWriter; import java.io.File; import java.io.FileNotFoundException; import java.io.FileReader; import java.io.FileWriter; import java.io.IOException; import java.io.InputStreamReader; import java.io.OutputStreamWriter; import java.util.ArrayList; import java.util.Collection; import java.util.Collections; import java.util.HashMap; import java.util.HashSet; import java.util.List; import java.util.Map; import java.util.logging.Level; import java.util.logging.Logger; import opennlp.ccg.lexicon.DefaultTokenizer; import opennlp.ccg.lexicon.Word; import opennlp.ccg.ngrams.ConditionalProbabilityTable; import opennlp.ccg.parse.tagger.io.SRILMFactoredBundleCorpusIterator; import opennlp.ccg.util.Interner; import opennlp.ccg.util.Pair; /** * (c) (2009) Dennis N. Mehay * @author Dennis N. Mehay * * Model for predicting p(POS | word). Uses an ARPA-formatted * SRILM-trained "unigram" factored LM for this, where each "unigram" is * a bundle of word:pos. */ public class POSPriorModel extends ConditionalProbabilityTable { public static final String WORD = DefaultTokenizer.WORD_ATTR; public static final String POS_TAG = DefaultTokenizer.POS_ATTR; private Interner> pairs = new Interner>(); /** * Re-usable list for attr-val pairs of word-pos-supertag inputs to the prior model * (i.e., for predicting p(STag | word, POS). */ public List> attrVals = new ArrayList>(5); /** * A comparator for sorting Pair's where the Double is a probability * (effectively sorts by descending order of probability). */ private ProbPairComparator ppcomp = new ProbPairComparator(); /** All the priors. Reference them when getting beta-best, beta-worst, etc. */ List> priors = new ArrayList>(1000); /** String[] of all possible POS outcomes. */ private String[] posVocab = null; /** Construct a prior model with the FLM config file and corresponding vocab file. 
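* The vocab file is the one written by this class's {@code main} method: one escaped factor per
* line, prefixed with either the POS or the word attribute name plus a hyphen. Only the
* POS-prefixed entries are read back here to build the set of possible POS outcomes.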
*/ public POSPriorModel(String flmFile, String vocabFile) throws IOException { super(flmFile); String post = null; BufferedReader br = new BufferedReader(new FileReader(new File(vocabFile))); post = br.readLine().trim(); // get next POS tag from the vocab. while ((post != null) && !post.trim().startsWith(POS_TAG + "-")) { post = br.readLine(); } if (post != null) { post = post.trim().split("-")[1]; } Collection allSupertags = new HashSet(); // find out how many outcomes we have. int cnt = 0; while (post != null) { cnt++; allSupertags.add(post); while ((post != null) && !post.trim().startsWith(POS_TAG + "-")) { post = br.readLine(); } if (post != null) { post = post.trim().split("-")[1]; } } // initialize the arrays to this size. posVocab = new String[cnt]; cnt = 0; // fill the vocab array with all possible POS tags. for (String posTag : allSupertags) { posVocab[cnt++] = posTag.intern(); } br.close(); } /** Get the prior probability of this POS/word combo. */ public double getPriorOf(String pos, String word) { attrVals.clear(); Pair surfaceForm = pairs.intern(new Pair(WORD, word.intern())); attrVals.add(surfaceForm); Pair partOfSpeech = pairs.intern(new Pair(POS_TAG, pos.intern())); attrVals.add(partOfSpeech); return score(attrVals); } /** Get the POS-dict restricted prior distribution (sorted descending by prob.) */ public List> getPriors(Word w) { List> sortedTags = new ArrayList>(posVocab.length); for (String postag : posVocab) { sortedTags.add(new Pair(getPriorOf(postag, w.getForm()), postag)); } Collections.sort(sortedTags, ppcomp); return sortedTags; } /* added by DCE, to facilitate use in hypertagging * Identical to above method, but accepts a String (name of EP) rather than * a Word object. */ public List> getPriors(String s) { s.intern(); List> sortedTags = new ArrayList>(posVocab.length); for (String postag : posVocab) { sortedTags.add(new Pair(getPriorOf(postag, s), postag)); } Collections.sort(sortedTags, ppcomp); return sortedTags; } public static void main(String[] args) throws IOException { String usage = "\nPOSPriorModel -vocab (-c [default = ]) (-o [default = ])\n"; if (args.length > 0 && args[0].equals("-h")) { System.out.println(usage); System.exit(0); } SRILMFactoredBundleCorpusIterator in = null; BufferedWriter out = null; BufferedWriter voc = null; try { String inputCorp = "", output = "", vocabFile = "vocab.voc"; for (int i = 0; i < args.length; i++) { if (args[i].equals("-c")) { inputCorp = args[++i]; continue; } if (args[i].equals("-o")) { output = args[++i]; continue; } if (args[i].equals("-vocab")) { vocabFile = args[++i]; continue; } System.out.println("Unrecognized option: " + args[i]); } try { in = new SRILMFactoredBundleCorpusIterator( (inputCorp.equals("")) ? new BufferedReader(new InputStreamReader(System.in)) : new BufferedReader(new FileReader(new File(inputCorp)))); } catch (FileNotFoundException ex) { System.err.print("Input corpus " + inputCorp + " not found. Exiting..."); Logger.getLogger(POSPriorModel.class.getName()).log(Level.SEVERE, null, ex); System.exit( -1); } try { out = (output.equals("")) ? new BufferedWriter(new OutputStreamWriter(System.out)) : new BufferedWriter(new FileWriter(new File(output))); } catch (IOException ex) { System.err.print("Output file " + output + " not found. 
Exiting..."); Logger.getLogger(POSPriorModel.class.getName()).log(Level.SEVERE, null, ex); System.exit( -1); } try { voc = new BufferedWriter(new FileWriter(new File(vocabFile))); } catch (IOException ex) { Logger.getLogger(POSPriorModel.class.getName()).log(Level.SEVERE, null, ex); } Map vocab = new HashMap(); for (List inLine : in) { for (Word w : inLine) { String pos = POS_TAG + "-" + DefaultTokenizer.escape(w.getPOS()), wform = WORD + "-" + DefaultTokenizer.escape(w.getForm()); vocab.put(pos, (vocab.get(pos) == null) ? 1 : vocab.get(pos) + 1); vocab.put(wform, (vocab.get(wform) == null) ? 1 : vocab.get(wform) + 1); out.write(wform + ":" + pos + " "); } out.write(System.getProperty("line.separator")); } out.flush(); for (String str : vocab.keySet()) { voc.write(str + System.getProperty("line.separator")); } voc.flush(); } finally { try { out.close(); in.close(); voc.close(); } catch (IOException ex) { Logger.getLogger(POSPriorModel.class.getName()).log(Level.SEVERE, null, ex); } } } } ================================================ FILE: src/opennlp/ccg/parse/postagger/ml/POSTagFex.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (c) 2010 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed inp the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.postagger.ml; import java.io.BufferedReader; import java.io.BufferedWriter; import java.io.File; import java.io.FileReader; import java.io.FileWriter; import java.io.IOException; import java.io.InputStreamReader; import java.io.OutputStreamWriter; import java.util.ArrayList; import java.util.Collection; import java.util.Collections; import java.util.HashMap; import java.util.List; import java.util.Map; import opennlp.ccg.parse.tagger.Constants; import opennlp.ccg.parse.supertagger.ml.FeatureExtractor; import opennlp.ccg.parse.tagger.TaggedWord; import opennlp.ccg.util.Pair; import opennlp.ccg.parse.tagger.io.SRILMFactoredBundleCorpusIterator; import opennlp.ccg.lexicon.Word; /** * Feature extractor for POS taggers. * * The inputs are "TaggedWord"s simply for consistency of interface. * There should be no tags assigned to the words (short, perhaps, TOBI * tags or the like). * * @author Dennis N. Mehay */ public class POSTagFex implements FeatureExtractor { private POSPriorModel posPrior = null; /** Constructor with a prior model (replaces tagging dictionary). */ public POSTagFex(POSPriorModel posPrior) { this.posPrior = posPrior; } /** Constructor without prior model. Prior features will not be used. 
*/ public POSTagFex() { this(null); } public static final String curL = "X"; public static final String prevL = "X-1"; public static final String prevPrevL = "X-2"; public static final String nextL = "X+1"; public static final String nextNextL = "X+2"; private static final String[] lxfLabs = {prevPrevL, prevL, curL, nextL, nextNextL}; private static final String prefix = "prefix", suffix = "suffix"; private static final String hyphen = "containsHyphen"; private static final String caps = "containsUC"; private static final String num = "containsNum"; private static final String neConn = "containsNEConnector"; private static final String priorF = "PPOS"; /** The string that connects elements of a fused named entity. */ private String neConnecter = "_"; /** Get a word's features for applying the tagger (i.e., not training mode). */ public Collection> getFeatures(Map sentence, Integer wordIndex) { return getFeatures(sentence, wordIndex, false); } /** Get a sentence of words' features for applying the tagger (i.e., not training mode). */ public List>> getSentenceFeatures(Map sentence) { return getSentenceFeatures(sentence, false); } /** * Get the features for a word in context. training == true iff the output class is to be collected as well. * * TODO: This and supertagger feature extractor (fex) should be merged into a more general, parameterizable * sentence-level contextual feature extractor. (VERY todo-ish, though.) */ public Collection> getFeatures(Map sentence, Integer wordIndex, boolean training) { Collection> result = new ArrayList>(30); TaggedWord current, prev, prevPrev, next, nextNext; current = sentence.get(wordIndex); // -------- The left periphery ------------ int wind = wordIndex.intValue(); if (wind > 1) { prev = sentence.get(wind - 1); prevPrev = sentence.get(wind - 2); } else if (wind > 0) { prev = sentence.get(wind - 1); prevPrev = Constants.OOB; } else { prev = prevPrev = Constants.OOB; } // -------- The right periphery ----------- int tempSize = sentence.size(); if ((tempSize - (wind + 1)) >= 2) { next = sentence.get(wind + 1); nextNext = sentence.get(wind + 2); } else if (tempSize - (wind + 1) >= 1) { next = sentence.get(wind + 1); nextNext = Constants.OOB; } else { next = nextNext = Constants.OOB; } Double activation = Constants.one; if (training) { result.add(new Pair(current.getPOS(), activation)); } // we do not use tag-sequence features in this model. // these are in a separate sequence model (n-gram model over POS sequences). // standard contextual features (word to the left, current word, word to the right, etc.). // these features are from Ratnaparkhi (1996). result.add(new Pair(curL + "=" + current.getForm(), activation)); result.add(new Pair(prevL + "=" + prev.getForm(), activation)); result.add(new Pair(prevPrevL + "=" + prevPrev.getForm(), activation)); result.add(new Pair(nextL + "=" + next.getForm(), activation)); result.add(new Pair(nextNextL + "=" + nextNext.getForm(), activation)); // features that replace the tagging dictionary. // add real-valued (activation = prior log-prob) features for each of the beta-best prior // tags, given this word. if(posPrior != null) { List> priors = posPrior.getPriors(current.getWord()); double beta = 0.1; double best = priors.get(0).a; String wform = current.getForm(); for(Pair prior : priors) { if(prior.a > (beta * best)) { // add the features PPOS=: and PPOS_word=_:. 
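// Illustrative example (scores made up): if the beta-best priors for the word "dog" are NN with
// score 0.8 and VB with score 0.2, this adds the real-valued features "PPOS=NN" and
// "PPOS_word=NN_dog" with activation 0.8, and "PPOS=VB" and "PPOS_word=VB_dog" with activation 0.2.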
result.add(new Pair(priorF + "=" + prior.b, prior.a)); result.add(new Pair(priorF + "_word" + "=" + prior.b + "_" + wform, prior.a)); } else { break; } } } // these are in addition to Ratnaparkhi's (1996) contextual features. // now for conjunctions of features: w-2w-1=..., w-1w+1=..., w+1w+2=... (same for posp). // (i.e., bigram features over words and parts of speech and bigrams of words and POSs that straddle the current token). // N.B. only use single-best POSs (maybe change later). TaggedWord[] wds = {prevPrev, prev, current, next, nextNext}; for (int j = 1; j < wds.length; j++) { result.add(new Pair(lxfLabs[j - 1] + "|" + lxfLabs[j] + "=" + wds[j - 1].getForm() + "|" + wds[j].getForm(), activation)); // also, if at the current word slot, add bigrams that straddle the current word. if (j == 2) { result.add(new Pair(lxfLabs[j - 1] + "|" + lxfLabs[j + 1] + "=" + wds[j - 1].getForm() + "|" + wds[j + 1].getForm(), activation)); } } // affix features from Ratnaparkhi (1996). // if the word's length is > 4, then extract the 1-, 2-, 3- and 4-character affixes. if(current.getForm().length() > 4) { StringBuffer prefixes = new StringBuffer(4), suffixes = new StringBuffer(4); char[] wdForm = current.getForm().toCharArray(); // prefixes. int cursor = 0; for(cursor = 0; cursor < 4; cursor++) { prefixes.append(wdForm[cursor]); result.add(new Pair(prefix+"="+prefixes.toString(), Constants.one)); } // suffixes. for(cursor = wdForm.length-1; cursor >= wdForm.length-5; cursor--) { suffixes.insert(0, wdForm[cursor]); result.add(new Pair(suffix+"="+suffixes.toString(), Constants.one)); } } // now do "contains hyphen", "contains number", "contains uppercase letter" and contains fused NE connecter (_) features. // also from Ratnaparkhi (1996). if(current.getForm().contains("-")) { result.add(new Pair(hyphen, Constants.one)); } if(current.getForm().matches(".*[0-9]+.*")) { result.add(new Pair(num, Constants.one)); } if(!current.getForm().toLowerCase().equals(current.getForm())) { result.add(new Pair(caps, Constants.one)); } // if we see a NE connector, this is likely a NNP (in English, e.g.). if(current.getForm().contains(neConnecter)) { result.add(new Pair(neConn, Constants.one)); } return result; } /** * Get the features for a sentence of words in context. * training == true iff the output classes are to be collected as well. */ public List>> getSentenceFeatures(Map sentence, boolean training) { List>> result = new ArrayList>>(30); List keys = new ArrayList(sentence.keySet().size()); for(Integer wordIndex : sentence.keySet()) { keys.add(wordIndex); } Collections.sort(keys); for(Integer wordIndex : keys) { result.add(getFeatures(sentence, wordIndex, training)); } return result; } public static void main(String[] args) throws IOException { String usage = "POSTagFex (-h [gets this message]) (-i [defaults to ]) (-o [defaults to ])\n"+ " (-p [.flm] -v )\n"; if(args.length > 0 && args[0].equals("-h")) { System.out.println(usage); System.exit(0); } String input = "", output = "", priorModF = null, priorVocab = null; for(int j = 0; j < args.length; j++) { if(args[j].equals("-i")) { input = args[++j]; continue; } if(args[j].equals("-o")) { output = args[++j]; continue; } if(args[j].equals("-p")) { priorModF = args[++j]; continue; } if(args[j].equals("-v")) { priorVocab = args[++j]; continue; } System.err.println("Unrecognized option: " + args[j]); } SRILMFactoredBundleCorpusIterator corp = new SRILMFactoredBundleCorpusIterator( input.equals("") ? 
new BufferedReader(new InputStreamReader(System.in)) : new BufferedReader(new FileReader(new File(input)))); BufferedWriter out = new BufferedWriter( output.equals("") ? new BufferedWriter(new OutputStreamWriter(System.out)) : new BufferedWriter(new FileWriter(new File(output)))); POSPriorModel posPriorMod = null; if(priorModF != null) { posPriorMod = new POSPriorModel(priorModF, priorVocab); } POSTagFex fexer = new POSTagFex(posPriorMod); for(List sentence : corp) { Map sent = new HashMap(sentence.size()); int index = 0; for(Word w : sentence) { sent.put(index++, new TaggedWord(w)); } List>> ftss = fexer.getSentenceFeatures(sent, true); for(Collection> fts : ftss) { index = 0; for(Pair ft : fts) { // if we're at the first item, print out the label. if (index == 0) { out.write(ft.a); } else { out.write(" " + ft.a + ":" + ft.b); } index++; } out.write(System.getProperty("line.separator")); } } out.flush(); } } ================================================ FILE: src/opennlp/ccg/parse/supertagger/JavaSupertaggingApp.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.supertagger; import opennlp.ccg.parse.tagger.util.ResultSink; import opennlp.ccg.parse.supertagger.ml.STFex; import opennlp.ccg.parse.supertagger.ml.FeatureExtractor; import opennlp.ccg.parse.tagger.ml.ZLMEM; import opennlp.ccg.parse.tagger.io.SRILMFactoredBundleCorpusIterator; import opennlp.ccg.parse.tagger.io.PipeDelimitedFactoredBundleCorpusIterator; import opennlp.ccg.parse.tagger.Constants; import java.io.*; import java.util.*; import static java.util.Arrays.*; import joptsimple.*; import opennlp.ccg.lexicon.Word; import opennlp.ccg.parse.supertagger.io.*; import opennlp.ccg.parse.supertagger.ml.*; import opennlp.ccg.parse.supertagger.util.*; import opennlp.ccg.util.Pair; /** * @author Dennis N. Mehay * @version $Revision: 1.6 $, $Date: 2010/09/21 04:12:41 $ */ public class JavaSupertaggingApp { public static void main(String[] args) throws Exception { try { // instantiate command-line option parser, setting up type-safe expectations about // what should be passed for the options. 
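// A hypothetical tagging-mode invocation (file names are illustrative only):
//   java opennlp.ccg.parse.supertagger.JavaSupertaggingApp --tag -d SRILM -i corpus.srilm \
//       -o tags.out -m st.mod -w worddict.xml -p posdict.xml -K 20 --beta 0.1 --seqModel=st.lm
// The accepted options and their argument types are declared just below.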
OptionParser parser = new OptionParser(); parser.acceptsAll(asList("train", "R"), "extract training features."); parser.acceptsAll(asList("tag", "T"), "supertag a POS-tagged file."); parser.acceptsAll(asList("test","E"), "test tagger against gold standard."); parser.acceptsAll(asList("tagdictextract", "D"), "extract tagging dictionaries."); parser.acceptsAll(asList("h", "?"), "show help."); OptionSpec tokenisation = parser.acceptsAll(asList("delimiter", "d")).withRequiredArg().ofType(String.class).describedAs("SRILM factor bundles or C&C-style" + "(pipe-delimited) factor bundles [choose one of: \"SRILM\", \"candc\"]"); OptionSpec goldstandspec = parser.acceptsAll(asList("g","gold")).withRequiredArg().ofType(File.class). describedAs("the gold standard tagged file [file must have same bundle format as input corpus, \"SRILM\" or \"candc\"]"); OptionSpec inputspec = parser.acceptsAll(asList("i", "input")).withRequiredArg().ofType(File.class).describedAs("training or tagging/testing file"); OptionSpec outputspec = parser.acceptsAll(asList("o", "output")).withRequiredArg().ofType(File.class).describedAs("output location (for training feats or tags)"); OptionSpec modspec = parser.acceptsAll(asList("m", "model")).withRequiredArg().ofType(File.class).describedAs("textual model file (ZhangLe maxent-style) [for tagging/testing only]"); OptionSpec priormodspec = parser.acceptsAll(asList("priorModelF")).withRequiredArg().ofType(String.class).describedAs("config file for ARPA-formatted FLM [for tagging/testing and feature extraction"+ "MUST also give vocab file]"); OptionSpec vocabspec = parser.acceptsAll(asList("vocabF")).withRequiredArg().ofType(String.class).describedAs("vocab file for ARPA-formatted FLM [for tagging/testing and feature extraction]"); OptionSpec kspec = parser.accepts("K").withRequiredArg().ofType(Integer.class).describedAs("K parameter of Clark and Curran [for tagging/testing only]"); OptionSpec betaspec = parser.accepts("beta").withRequiredArg().ofType(Double.class).describedAs("beam width for supertagger [for tagging only]"); OptionSpec wdictspec = parser.acceptsAll(asList("w", "worddict")).withRequiredArg().ofType(File.class).describedAs("path to the word-based tagging dictionary file"); OptionSpec pdictspec = parser.acceptsAll(asList("p", "posdict")).withRequiredArg().ofType(File.class).describedAs("path to the POS-based tagging dictionary file"); OptionSpec seqModel = parser.acceptsAll(asList("s","seqModel")).withOptionalArg().ofType(String.class).describedAs("the tag sequence model (for forward-backward tagging)"); OptionSpec fbBeam = parser.acceptsAll(asList("fbBeamWidth")).withOptionalArg().ofType(Integer.class).describedAs("maximum width of the forward-backward beam [default = 5]"); OptionSpec tagAlgorithm = parser.acceptsAll(asList("taggingAlgorithm")).withOptionalArg().ofType(String.class).describedAs("tagging algorithm. choose from {forward-backward, forward} [default = forward-backward]"); OptionSet options = parser.parse(args); if (options.has("?") || args.length == 0) { parser.printHelpOn(System.out); System.exit(0); } assert (options.valueOf(tokenisation).equalsIgnoreCase("candc") || options.valueOf(tokenisation).equalsIgnoreCase("srilm")); // Must say whether we are tagging (or testing) or training (extracting features, actually). assert (options.has("tag") || options.has("train") || options.has("test") || options.has("D")); // Can't both train and tag/test, or train and extract tagging dict, or tag/test and do the last. 
assert !(options.has("train") && (options.has("tag") || options.has("test"))); assert !(options.has("train") && options.has("D")); assert !((options.has("tag") || options.has("test")) && options.has("D")); // either we're doing forward-backward tagging, or we're not. assert (options.has("seqModel") || !(options.has("seqInterp") || options.has("fbBeamWidth"))); // Can't have a model file input when we are training.... assert !(options.has("train") && options.has("m")); // ... or when extracting a tag dict. assert !(options.has("D") && options.has("m")); // Must have tagging dict files when tagging or extracting tag dicts, // and additionally beta and K when tagging . assert (!(options.has("tag") || options.has("test") || options.has("D")) || (options.has("p") && options.has("w"))); assert (!(options.has("tag") || options.has("test")) || (options.has("K") && options.has("beta"))); // can't use prior model if no vocab file is given (so that the prior model knows which // classes to make probabilistic predictions over) or no POS dictionary is given (so // that we can restrict our priors to those supertags that have occurred with a particular // POS). assert (!(options.has("priorModelF") && (!options.has("vocabF") || !options.has("p")))); STPriorModel stPrior = null; if (options.has("priorModelF")) { stPrior = new STPriorModel(options.valueOf(priormodspec), options.valueOf(vocabspec), new XMLPOSDictionaryReader(options.valueOf(pdictspec)).read()); } if (options.has("tag") || options.has("test")) { long start = System.currentTimeMillis(); // tag (and potentially measure performance against the gold-standard). //File mod = options.valueOf(modspec); //Integer k = options.valueOf(kspec); Double beta = options.valueOf(betaspec); ZLMEM maxentModel; String seqMod = options.has("seqModel") ? options.valueOf(seqModel) : null; Integer fbWidth = options.has("fbBeamWidth") ? options.valueOf(fbBeam) : 5; String algStr = options.has("taggingAlgorithm") ? options.valueOf(tagAlgorithm) : "forward-backward"; Constants.TaggingAlgorithm alg = algStr.equalsIgnoreCase("forward") ? Constants.TaggingAlgorithm.FORWARD : Constants.TaggingAlgorithm.FORWARDBACKWARD; STTaggerWordDictionary wd = null; STTaggerPOSDictionary pd = null; if(options.has("w")) wd = new XMLWordDictionaryReader(options.valueOf(wdictspec)).read(); if(options.has("p")) pd = new XMLPOSDictionaryReader(options.valueOf(pdictspec)).read(); WordAndPOSDictionaryLabellingStrategy tagger = new WordAndPOSDictionaryLabellingStrategy( wd, pd, (options.has("K") ? 
options.valueOf(kspec).intValue() : 20), maxentModel = new ZLMEM(options.valueOf(modspec)), new STFex(stPrior), seqMod, alg); tagger.setMaxSearchBeam(fbWidth); maxentModel.verbose = true; Iterator> corpus = null; Iterator> goldCorpus = null; if(options.valueOf(tokenisation).equalsIgnoreCase("srilm")) { corpus = new SRILMFactoredBundleCorpusIterator(new BufferedReader(new FileReader(options.valueOf(inputspec)))); } else if(options.valueOf(tokenisation).equalsIgnoreCase("candc")) { corpus = new PipeDelimitedFactoredBundleCorpusIterator(new BufferedReader(new FileReader(options.valueOf(inputspec)))); } if(options.has("test") && options.valueOf(tokenisation).equalsIgnoreCase("srilm")) { goldCorpus = new SRILMFactoredBundleCorpusIterator(new BufferedReader(new FileReader(options.valueOf(goldstandspec)))); } else if(options.has("test") && options.valueOf(tokenisation).equalsIgnoreCase("candc")) { goldCorpus = new PipeDelimitedFactoredBundleCorpusIterator(new BufferedReader(new FileReader(options.valueOf(goldstandspec)))); } BufferedWriter outf = new BufferedWriter(new FileWriter(options.valueOf(outputspec))); boolean test = options.has("test"); ResultSink results = new ResultSink(); int sentCnt = 0; tagger.setBetas(new double[] {beta}); while(corpus.hasNext()) { sentCnt++; List sent = corpus.next(); List>> taggings = tagger.multitag(sent, beta); if(test) { List goldsent = goldCorpus.next(); results.addSent(taggings, goldsent); } Iterator sentiter = sent.iterator(); // output file format = word goldtag tag1 ... tagK outf.write(""+System.getProperty("line.separator")); for(List> tagging : taggings) { Word nextw = sentiter.next(); outf.write(nextw.getForm() + "\t1\t" + nextw.getPOS() + "\t1.0\t" + tagging.size() + "\t");// + nextw.getSupertag() + " "); //outf.write(nextw.getForm() + "|||"+ nextw.getStem() + "|||" + nextw.getPOS() + "|||"); String tags = ""; for(Pair tg : tagging) { //tags+="^"+tg.b+":"+tg.a; tags+= "\t" + tg.b + "\t"+tg.a; } // write out the multitagging, minus the initial space (tab). outf.write(tags.substring(1) + System.getProperty("line.separator")); //// write out the multitagging, minus the initial ^. //outf.write(tags.substring(1) + " "); } outf.write(""+System.getProperty("line.separator")); if(sentCnt % 10 == 0) { outf.flush(); } } outf.flush(); outf.close(); if(test) { System.err.println(results.report()); } long end = System.currentTimeMillis(); System.err.println("Time to tag: " + ((end - start + 0.0)/1000) + " seconds."); } else if (options.has("tagdictextract")) { // extract tagging dictionaries. File wd = options.valueOf(wdictspec); File pd = options.valueOf(pdictspec); File inf = options.valueOf(inputspec); TaggingDictionaryExtractor tde = new TaggingDictionaryExtractor(inf,wd,pd,options.valueOf(tokenisation)); System.err.println("Extracting dictionaries from: "+inf.toString()+" into files: "+wd.toString()+" and: "+pd.toString()+"\n(wdict and posdict, resp.)."); tde.extract(); } else { // train (extract features). File inf = options.valueOf(inputspec); File outf = options.valueOf(outputspec); FeatureExtractor fexer = (stPrior == null) ? new STFex() : new STFex(stPrior); ZhangLeTrainingExtractor fexApp = new ZhangLeTrainingExtractor(inf, outf, options.valueOf(tokenisation), fexer); System.err.println("Extracting features from file: " + inf.toString() + ", and placing extracted features in: " + outf.toString() + "."); fexApp.writeFeats(); } } catch (OptionException e) { throw e; } catch (Exception e) { throw e; //System.err.println("Something went wrong. 
Double-check your inputs."); } } } ================================================ FILE: src/opennlp/ccg/parse/supertagger/LabellingStrategy.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.supertagger; import java.util.Collection; import java.util.List; import opennlp.ccg.lexicon.Word; import opennlp.ccg.util.Pair; //import ml.MaxentModel; /** * @author Dennis N. Mehay * @version $Revision: 1.2 $, $Date: 2010/09/21 04:12:41 $ */ public interface LabellingStrategy { /** * A method to reset the K parameter (for word dictionaries). * @param newK An int to replace the int value of K. * @returns null. */ public void setK(int newK); /** Multitag a TaggedWord and throw away the probabilities. */ public List multitag(Word thisword, Collection> context, double beta); /** Multitag a TaggedWord and retain the probabilities. */ public List> multitagWithScores(Word thisword, Collection>contex, double beta); } ================================================ FILE: src/opennlp/ccg/parse/supertagger/WordAndPOSDictionaryLabellingStrategy.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.supertagger; import java.io.BufferedReader; import java.io.BufferedWriter; import java.io.File; import java.io.FileNotFoundException; import java.io.FileReader; import java.io.FileWriter; import opennlp.ccg.parse.supertagger.io.XMLWordDictionaryReader; import opennlp.ccg.parse.supertagger.io.XMLPOSDictionaryReader; import opennlp.ccg.parse.supertagger.ml.STFex; import opennlp.ccg.parse.supertagger.ml.FeatureExtractor; import opennlp.ccg.parse.tagger.ProbIndexPair; import opennlp.ccg.parse.tagger.TaggedWord; import opennlp.ccg.parse.tagger.Constants; import opennlp.ccg.parse.tagger.io.SRILMFactoredBundleCorpusIterator; import java.io.IOException; import java.io.InputStreamReader; import java.io.OutputStreamWriter; import java.util.*; import java.util.logging.Level; import java.util.logging.Logger; import opennlp.ccg.lexicon.*; import opennlp.ccg.parse.Supertagger; import opennlp.ccg.parse.postagger.DummyPOSTagger; import opennlp.ccg.parse.postagger.POSTagger; import opennlp.ccg.parse.supertagger.ml.STPriorModel; import opennlp.ccg.parse.tagger.ml.MaxentModel; import opennlp.ccg.parse.supertagger.util.*; import opennlp.ccg.parse.tagger.Constants.TaggingAlgorithm; import opennlp.ccg.parse.tagger.ml.ZLMEM; import opennlp.ccg.util.Pair; import opennlp.ccg.parse.tagger.sequencescoring.SequenceScorer; import opennlp.ccg.parse.tagger.util.ConfigFileProcessor; import opennlp.ccg.parse.tagger.util.ResultSink; /** * A `labelling strategy' for a CCG supertagger that * restricts the output of the model based on word and POS `tagging * dictionaries' in the following way: * * if a word w occurs at least K times in training, the model's output * is constrained to the outcomes seen with w during training. If w * did not occur at least K times during training, the model's output is * constrained to the outcomes seen with w's POS tag during training. * In the off chance that the POS tag was not seen in training, the model's * best prediction is used. * * @author Dennis N. Mehay * @version $Revision: 1.22 $, $Date: 2011/03/22 03:20:25 $ */ public class WordAndPOSDictionaryLabellingStrategy implements LabellingStrategy, Supertagger { // print warnings? private boolean verbose = false; // use tagging dictionaries? private boolean useWordDict = false; private boolean usePOSDict = false; private SequenceScorer seqScorer = null; private STTaggerWordDictionary wd; private STTaggerPOSDictionary pd; private int K, usualK, finalK; private MaxentModel mo; // extracts features from the context of a word. private FeatureExtractor fexer = new STFex(); // postagger for non-gold-POS supertagging. private POSTagger posTagger; // the current tagging. private List tagging; // POS-specific multipliers to "tighten" or "loosen" up the tagging beam width // ("beta") as needed. E.g., the beta for period/full stop might not need to be // very permissive, while those for lexical verbs or some fancy punctuation marks // might need to be. public Map betaMultipliers = new HashMap(); public double minMultiplier = 1.0; /** Constructor without n-gram model (for scoring tag sequences). */ public WordAndPOSDictionaryLabellingStrategy(STTaggerWordDictionary wd, STTaggerPOSDictionary pd, int K, MaxentModel mo, FeatureExtractor fexer) { this(wd, pd, K, mo, fexer, null, null); } /** Constructor WITH n-gram model (for scoring tag sequences). 
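* Delegates to the full constructor with a {@code DummyPOSTagger}, i.e. the POS tags already
* present on the input words are used as-is rather than re-predicted.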
*/ public WordAndPOSDictionaryLabellingStrategy( STTaggerWordDictionary wd, STTaggerPOSDictionary pd, int K, MaxentModel mo, FeatureExtractor fexer, String tagSequenceModel, Constants.TaggingAlgorithm alg) { this(wd, pd, K, mo, fexer, tagSequenceModel, alg, new DummyPOSTagger()); } /** Constructor with n-gram model and POS tagger */ public WordAndPOSDictionaryLabellingStrategy( STTaggerWordDictionary wd, STTaggerPOSDictionary pd, int K, MaxentModel mo, FeatureExtractor fexer, String tagSequenceModel, Constants.TaggingAlgorithm alg, POSTagger posTagger) { this.wd = wd; this.pd = pd; this.mo = mo; this.posTagger = posTagger; if (K > 0) { this.K = K; } else { this.K = 0; } usualK = K; finalK = K; this.fexer = fexer; try { if (tagSequenceModel != null) { // find the n-gram order of the model. int ord = SequenceScorer.findOrder(tagSequenceModel); // load it into the SequenceScorer. seqScorer = new SequenceScorer(ord, tagSequenceModel); seqScorer.setSearchBeam(5); seqScorer.setAlgorithm(alg); } } catch (IOException ex) { Logger.getLogger(WordAndPOSDictionaryLabellingStrategy.class.getName()).log(Level.SEVERE, null, ex); } } public void useWordDict(boolean useIt) { useWordDict = useIt; } public void usePOSDict(boolean useIt) { usePOSDict = useIt; } public WordAndPOSDictionaryLabellingStrategy(STTaggerWordDictionary wd, STTaggerPOSDictionary pd, int K, MaxentModel mo) { this(wd, pd, K, mo, new STFex()); } /** * Set the maximum width of the beam in the forward-backward tagger. */ public void setMaxSearchBeam(int maxSearchBeam) { if (seqScorer != null) seqScorer.setSearchBeam(maxSearchBeam); } /** * Reset the K parameter. */ public void setK(int newK) { this.K = newK; } /** * Set the usual K parameter. */ public void setUsualK(int newK) { this.usualK = newK; } /** * Set the final K parameter. */ public void setFinalK(int newK) { this.finalK = newK; } /** * A method that returns all labels given by the model that both (1) are assigned a probability `p' s.t.: * p >= (`beta' * best), where `beta' is a factor passed in by the client of this method and * best is the probability of the most probable outcome of the model, and (2) (if the word * (obtained from the String[] `context') has occurred at least K times in training) * are in the STTaggerWordDictionary under the entry for said word. If the word did * not occur at least K times in training, the output set is constrained by a STTaggerPOSDictionary. * In the off chance that a POS did not occur in the training data, the model's predictions themselves are * submitted to the `beta constraint'. * * @param context A String[] of contextual predicates (in the maximum entropy modelling sense) * @param mo A MaxentModel. * @param beta A double specifying how close in probability all returned outcomes must be. * @return An ArrayList of labels that meet the above constraints. */ public List<String> multitag(Word w, Collection<Pair<String,Double>> context, double beta) { List<Pair<Double,String>> temp = this.multitagWithScores(w, context, beta); ArrayList<String> res = new ArrayList<String>(temp.size()); for (Pair<Double,String> t : temp) { res.add(t.b); } return res; } /** * A method to return the set of labels that are greater than or equal to * the best label multiplied by a factor `beta', given a model and a String[] * of contextual predicates. * @param thisWord an opennlp.ccg.lexicon.Word representing the current word being tagged. * @param context A Collection<Pair<String,Double>> of contextual predicates * (in the maximum entropy modelling sense) with their corresponding activations (real-valued, hence the * Double).
* @param model A model for generating the base predictions. * @param beta A positive double specifying how close to the best label * each label returned must be. * @return An ArrayList> of the outcomes * {o: score(o)>=[beta * score(bestLabel)]}. */ public List> multitagWithScores(Word thisWord, Collection> context, double beta) { // All the scores of the outcomes (the index of each double score // is the key which allows us to retrieve the outcome from the model). double[] ocs = mo.eval(context); // Sort in descending order of probability. ProbIndexPair[] sortedOutcomes = new ProbIndexPair[ocs.length]; for (int i = 0; i < ocs.length; i++) { sortedOutcomes[i] = new ProbIndexPair(new Double(ocs[i]), new Integer(i)); } Arrays.sort(sortedOutcomes); String tempOutcome = ""; String word = thisWord.getForm(); String pos = thisWord.getPOS(); ArrayList> retVal = new ArrayList>(30); // Find the best outcomes seen with the word in training that // meet the `beta' constraint. // ******************************************************************************************* double bestOutcomeProb, currentOutcomeProb; bestOutcomeProb = 0; // mww: changed to not always include front of list, as it may not meet dict constraints ProbIndexPair temp; // Now loop to see how many make the cut. // (But make sure to be sensitive to the dictionary, if necessary.) // See whether the word has a freq of this.K in the training corpus. Collection wordPermittedOutcomes = (wd != null) ? this.wd.getEntry(word, this.K) : null; if (wordPermittedOutcomes != null && useWordDict) { // The word (lemma) was seen at least K times in training. // Get all beta-OK outcomes that are in the dictionary entry. for (int ocInd = 0; ocInd < sortedOutcomes.length; ocInd++) { temp = sortedOutcomes[ocInd]; tempOutcome = mo.getOutcome(temp.b.intValue()); currentOutcomeProb = temp.a.doubleValue(); if (wordPermittedOutcomes.contains(tempOutcome)) { if (bestOutcomeProb == 0) { bestOutcomeProb = currentOutcomeProb; } if (currentOutcomeProb >= (bestOutcomeProb * beta)) { // Beta constraint. // The cut-off was met, add the outcome. retVal.add(new Pair(temp.a, tempOutcome)); // update max, for first selected outcome if (currentOutcomeProb > bestOutcomeProb) { bestOutcomeProb = currentOutcomeProb; } } else { // Else, since our ProbIndexPair[] is sorted by probablity, there will be no more // outcomes that make the (beta) cut. break; } } // If the word is not in the dictionary specified outcomes, move along. } } else { // Revert to the POS dictionary. Collection posPermittedOutcomes = null; if (pos != null) { posPermittedOutcomes = (pd != null) ? this.pd.getEntry(pos) : null; } else { if(verbose) { System.err.println("warning: null POS for: " + word);} // mww: check for null pos } if (posPermittedOutcomes != null && usePOSDict) { // Get all beta-OK outcomes that are in the POS dictionary entry. for (int ocInd2 = 0; ocInd2 < sortedOutcomes.length; ocInd2++) { temp = sortedOutcomes[ocInd2]; tempOutcome = mo.getOutcome(temp.b.intValue()); currentOutcomeProb = temp.a.doubleValue(); if (posPermittedOutcomes.contains(tempOutcome.trim())) { if (bestOutcomeProb == 0) { bestOutcomeProb = currentOutcomeProb; } if (currentOutcomeProb >= (bestOutcomeProb * beta)) { // Beta constraint. // Made the cut-off, add the outcome. 
retVal.add(new Pair(temp.a, tempOutcome)); // update max, for first selected outcome if (currentOutcomeProb > bestOutcomeProb) { bestOutcomeProb = currentOutcomeProb; } } else { // Else, since our ProbIndexPair[] is sorted by probablity, there will be no more // outcomes that make the (beta) cut. break; } } // If the word is not in the dictionary specified outcomes, move along. } } else { // Otherwise, just get all model predictions that meet the beta constraint, // ignoring the word and POS dictionaries. for (int ocInd3 = 0; ocInd3 < sortedOutcomes.length; ocInd3++) { temp = sortedOutcomes[ocInd3]; currentOutcomeProb = temp.a.doubleValue(); if (bestOutcomeProb == 0) { bestOutcomeProb = currentOutcomeProb; } if (currentOutcomeProb >= (bestOutcomeProb * beta)) { // Made the cut-off, add the outcome. retVal.add(new Pair(temp.a, mo.getOutcome(temp.b.intValue()))); // update max, for first selected outcome if (currentOutcomeProb > bestOutcomeProb) { bestOutcomeProb = currentOutcomeProb; } } else { // Else, since our ProbIndexPair[] is sorted by probability, there will be no more // outcomes that make the cut. break; } } } } // include the gold standard tag, if not in there. if(includeGold) { // assume input word has the gold tag in it. String gold = thisWord.getSupertag(); // check whether gold is in the output. boolean containsGold = false; for(Pair tg : retVal) { if(tg.b.equals(gold)) { containsGold = true; break; } } if(!containsGold) { // insert it containsGold = false; for(ProbIndexPair oc : sortedOutcomes) { if(mo.getOutcome(oc.b).equals(gold)) { retVal.add(new Pair(oc.a, mo.getOutcome(oc.b))); containsGold = true; break; } } } if(!containsGold) { // if the gold-standard still isn't in there, it must not be part of the tag set, add it with epsilon probability. // we're assuming that gold tags are needed for a training routine that doesn't care about supertag probabilities // (as in Clark and Curran (2007)). // check to see whether we are in the log domain (by checking for negative scores -- kind of a hack). retVal.add(new Pair((sortedOutcomes[0].a < 0) ? -99 : 1.0112214926104486e-43, thisWord.getSupertag())); } } // ******************************************************************************************* return retVal; } // get the current tagging (now only used to grab the POS tagging). public List getCurrentTagging() { return tagging; } // set the current tagging (now only used to set the current POS tagging). public void setCurrentTagging(List tgging) { tagging = tgging; } public List>> multitag(List sentence, double beta) { List>> results = new ArrayList>>(sentence.size()); Map sent = new TreeMap(); int cnt = 0; List taggedSent = posTagger.tagSentence(sentence); setCurrentTagging(taggedSent); for (TaggedWord werd : taggedSent) { sent.put(new Integer(cnt++), werd); } List>> contexts = fexer.getSentenceFeatures(sent); // Iterate simultaneously through both the words and the contextual features. Iterator wds = sentence.iterator(); Word w = null; Iterator>> ctxts = contexts.iterator(); Collection> context = null; int cursor = 0; while (wds.hasNext() && ctxts.hasNext()) { // get the next word. w = wds.next(); if(w.getPOS() == null) { w = Word.createFullWord(w, w.getForm(), tagging.get(cursor).getPOSTagging().get(0).b, w.getSupertag(), w.getSemClass()); } context = ctxts.next(); if (seqScorer != null) { // increase the tag ambiguity (for re-scoring using forward-backward). 
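// For example, with beta = 0.08 and no POS-specific multipliers (minMultiplier = 1.0),
// newBeta = min(0.08 * 1.0, 0.08 / 8) = 0.01, so the beam feeding the rescorer is eight times
// more permissive than the final one; very small betas (< 1e-5) are only halved instead.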
double newBeta = Math.min(beta * minMultiplier, beta / 8); if(beta < 0.00001) { newBeta = Math.min(beta * minMultiplier, beta / 2); } results.add(multitagWithScores(w, context, newBeta)); } else { results.add(multitagWithScores(w, context, beta)); } cursor++; } List>> finalResults = null; if (seqScorer != null) { // rescore and filter. pass in input sentence (in case, e.g., we have set the includeGold flag). finalResults = betaBestFilter(seqScorer.rescoreSequence(results), beta, sentence); } else { finalResults = results; } return finalResults; } /** * Return a beta-best filtered subset of the tags in each multitagging list (each multitagging list is assumed to be non-empty). */ private List>> betaBestFilter(List>> multitaggings, double beta, List inputSentence) { List>> res = new ArrayList>>(multitaggings.size()); int wordIndex = 0; for (List> mtagging : multitaggings) { List> tempTagging = new ArrayList>(mtagging.size()); Word thisWord = inputSentence.get(wordIndex); // set to a (possibly different, possibly less restrictive?) beta if this POS has a beta multiplier set. Double bmult = betaMultipliers.get(thisWord.getPOS()); double possiblyNewBeta = Math.min(1.0, (bmult != null) ? (bmult * beta) : beta); double best = mtagging.get(0).a; for (Pair tg : mtagging) { if (tg.a >= (possiblyNewBeta * best) || (includeGold && tg.b.equals(thisWord.getSupertag()))) { tempTagging.add(tg); } else { if(!includeGold) { // if we're not still fishing for gold... // ...stop, since they're in sorted order. break; } } } res.add(tempTagging); wordIndex++; } return res; } //------------------------------------------------------------------------- // Supertagger interface methods (added by Michael White) /** * The sequence of beta values to use in tagging. */ protected double[] betas = null; /** * The current betaIndex. */ protected int betaIndex = 0; /** * The current tagging. */ protected List>> currentTagging = null; /** * The current word. */ protected int currentWord = 0; /** * Flag for whether to include gold tags. */ protected boolean includeGold = false; /** Sets the beta values. */ public void setBetas(double[] betas) { this.betas = betas; } /** Returns all the beta values. */ public double[] getBetas() { return betas; } /** Returns the current beta value. */ public double getCurrentBetaValue() { return betas[betaIndex]; } /** * Advances beta to the next most restrictive setting. */ public void nextBeta() { betaIndex++; } /** * Advances beta to the next less restrictive setting. */ public void previousBeta() { betaIndex--; } /** * Returns whether there are any less restrictive beta settings * remaining in the sequence. */ public boolean hasMoreBetas() { return betaIndex < betas.length - 1; } /** * Returns whether there are any more restrictive beta settings * remaining in the sequence. */ public boolean hasLessBetas() { return betaIndex > 0; } /** * Resets beta to the most restrictive value. */ public void resetBeta() { betaIndex = 0; } /** * Resets beta to the least restrictive value. */ public void resetBetaToMax() { betaIndex = betas.length - 1; } /** * Sets the flag for whether to include gold tags. */ public void setIncludeGold(boolean includeGold) { this.includeGold = includeGold; } /** * Maps the given words to their predicted categories, * so that the beta-best categories can be returned by calls to setWord * and getSupertags. 
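* While less restrictive beta settings remain in the sequence, the usual K is used for the word
* dictionary cutoff; once the last (least restrictive) beta is reached, the final K takes over.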
*/ public void mapWords(List words) { if(hasMoreBetas()) { K = usualK; } else { K = finalK; } currentTagging = multitag(words, getCurrentBetaValue()); } /** * Sets the current word to the one with the given index, * so that the beta-best categories for it can be returned by a call to * getSupertags. */ public void setWord(int index) { currentWord = index; } /** * Returns the supertags of the desired categories for the current lexical lookup * as a map from supertags to contextual probabilities (or null to accept all). */ public Map getSupertags() { Map retval = new HashMap(); List> tags = currentTagging.get(currentWord); for (Pair tag : tags) { retval.put(tag.b, tag.a); } return retval; } /** * A factory method to make a supertagger from a config file (see the sample config file: * * $OPENCCG_HOME/ccgbank/models/supertagger/st.config * * for more information). */ @SuppressWarnings("unused") public static WordAndPOSDictionaryLabellingStrategy supertaggerFactory(String configFile) { WordAndPOSDictionaryLabellingStrategy res = null; String[] pathKeys = { "priormodel", "priormodelvocab", "sequencemodel", "wdict", "posdict", "maxentmodel", "posconfig" }; Map opts = ConfigFileProcessor.readInConfig(configFile, pathKeys); boolean verbose = (opts.get("verbose").equals("true")) ? true : false; // 'S' is for string repr. String priorModS = opts.get("priormodel"), priorVocabS = opts.get("priormodelvocab"), seqModS = opts.get("sequencemodel"), wDictS = opts.get("wdict"), pDictS = opts.get("posdict"), firstKS = opts.get("firstk"), lastKS = opts.get("lastk"), maxentModS = opts.get("maxentmodel"), posConfigS = opts.get("posconfig"), betasS = opts.get("betas"), betaMults = opts.get("betamultipliers"), // POS-specific multipliers to "tighten" or "loosen" up the tagging beam width. includeGold = opts.get("includegold"); assert (maxentModS != null) : "Empty maxent model."; // either use prior model (and have prior vocab specified) or not. assert (priorModS != null && priorVocabS != null) || (priorModS == null && priorVocabS == null) : "using prior model with no vocab file."; // ensure that there are word- and pos-keyed tagging dicts if there // is no st prior model. assert (wDictS == null || pDictS == null) && priorModS == null : "need tagging dicts if no supertagging prior model and prior vocab are specified."; // need the POS-keyed tagging dict, no matter what. assert (priorModS != null && pDictS == null) : "need POS-keyed tagging dict for prior model."; // need 'K' values if not using tagging dicts. assert (priorModS == null || (firstKS != null & lastKS != null)) : "need to specify first and last 'K' value when not using prior model."; // seqMod probably shouldn't be null. warn if in verbose mode. if(seqModS == null && verbose) { System.err.println("Warning: empty sequence model. Performance will suffer."); } STPriorModel priorM = null; if(priorModS != null && priorVocabS != null) { try { priorM = new STPriorModel(priorModS, priorVocabS); } catch (IOException ex) { Logger.getLogger(WordAndPOSDictionaryLabellingStrategy.class.getName()).log(Level.SEVERE, null, ex); } } STFex fex = new STFex(priorM); STTaggerWordDictionary wD = (wDictS != null) ? new XMLWordDictionaryReader(new File(wDictS)).read() : null; STTaggerPOSDictionary pD = (pDictS != null) ? new XMLPOSDictionaryReader(new File(pDictS)).read() : null; int kay = (opts.get("firstk") == null) ? 20 : Integer.parseInt(opts.get("firstk")), firstK, lastK; firstK = (opts.get("firstk") == null) ? 
20 : Integer.parseInt(opts.get("firstk")); lastK = (opts.get("lastk") == null) ? 100 : Integer.parseInt(opts.get("lastk")); double[] betaz = new double[betasS.split("\\s+").length]; int cursor = 0; for(String beta : betasS.split("\\s+")) { betaz[cursor++] = Double.parseDouble(beta); } // should we use the tagging dictionaries (yes if there is no prior model). boolean useWordDictionary = (wDictS != null); boolean usePOSDictionary = (pDictS != null); POSTagger pTagger = (posConfigS == null) ? null : POSTagger.posTaggerFactory(posConfigS); TaggingAlgorithm alg = (opts.get("taggingalgorithm") == null || opts.get("taggingalgorithm").equals("forward-backward")) ? TaggingAlgorithm.FORWARDBACKWARD : TaggingAlgorithm.FORWARD; MaxentModel mem = new ZLMEM(new File(maxentModS)); //STTaggerWordDictionary wd,STTaggerPOSDictionary pd, int K, MaxentModel mo, FeatureExtractor fexer, //String tagSequenceModel, Constants.TaggingAlgorithm alg, POSTagger posTagger res = (pTagger != null) ? new WordAndPOSDictionaryLabellingStrategy(wD, pD, kay, mem, fex, seqModS, alg, pTagger) : new WordAndPOSDictionaryLabellingStrategy(wD, pD, kay, mem, fex, seqModS, alg); res.setK(kay); res.setUsualK(firstK); res.setFinalK(lastK); res.setBetas(betaz); res.useWordDict(useWordDictionary); res.usePOSDict(usePOSDictionary); res.setIncludeGold((opts.get("includegold") == null || opts.get("includegold").equals("false")) ? false : true); // get POS-specific beta multipliers (as a string of pairs -- all space delimited). if(betaMults != null) { String[] bmts = betaMults.split("\\s+"); for(int a=0, b=1; b < bmts.length; a = a + 2, b = b + 2) { double mul = Double.parseDouble(bmts[b]); res.betaMultipliers.put(bmts[a], mul); if(mul < res.minMultiplier) { res.minMultiplier = mul; } } } return res; } public static void main(String[] args) { String usage = "\nWordAndPOSDictLabellingStrategy (-h [gets this message]) -e [defaults to not testing] -c > -beta [0.0,1.0]\n"+ " (-i [default=]) (-o [default=])\n"; if (args.length > 0 && args[0].equals("-h")) { System.out.println(usage); System.exit(0); } SRILMFactoredBundleCorpusIterator in = null; BufferedWriter out = null; try { String inputCorp = "", output = "", configFile = null; double beta = 1.0; boolean test = false; for (int i = 0; i < args.length; i++) { if (args[i].equals("-i")) { inputCorp = args[++i]; continue; } if (args[i].equals("-o")) { output = args[++i]; continue; } if (args[i].equals("-e")) { test = true; continue; } if (args[i].equals("-c")) { configFile = args[++i]; continue; } if (args[i].equals("-beta")) { beta = Double.parseDouble(args[++i]); continue; } System.out.println("Unrecognized option: " + args[i]); } ResultSink rs = new ResultSink(ResultSink.ResultSinkType.SUPERTAG); try { in = new SRILMFactoredBundleCorpusIterator( (inputCorp.equals("")) ? new BufferedReader(new InputStreamReader(System.in)) : new BufferedReader(new FileReader(new File(inputCorp)))); } catch (FileNotFoundException ex) { System.err.print("Input corpus " + inputCorp + " not found. Exiting..."); Logger.getLogger(WordAndPOSDictionaryLabellingStrategy.class.getName()).log(Level.SEVERE, null, ex); System.exit(-1); } try { out = (output.equals("")) ? new BufferedWriter(new OutputStreamWriter(System.out)) : new BufferedWriter(new FileWriter(new File(output))); } catch (IOException ex) { System.err.print("Output file " + output + " not found. 
Exiting..."); Logger.getLogger(WordAndPOSDictionaryLabellingStrategy.class.getName()).log(Level.SEVERE, null, ex); System.exit(-1); } WordAndPOSDictionaryLabellingStrategy stgger = WordAndPOSDictionaryLabellingStrategy.supertaggerFactory(configFile); // for each sentence, print out: // // w1 ... ... // ... // wN ... ... // for (List inLine : in) { List>> taggedSent = stgger.multitag(inLine, beta); if(test) { rs.addSent(taggedSent, inLine); } // beginning of sentence... out.write("" + System.getProperty("line.separator")); List posTagging = stgger.getCurrentTagging(); int cursor = -1; while(++cursor < taggedSent.size()) { Word wdIn = inLine.get(cursor); // word form... out.write(wdIn.getForm()); TaggedWord posT = posTagging.get(cursor); // print out number of POS tags, followed by tab-separated probabilized POS tagging. out.write("\t" + posT.getPOSTagging().size()); for(Pair pt : posT.getPOSTagging()) { out.write("\t" + pt.b + "\t" + pt.a); } // now print out number of and list of tab-separated, probabilized supertags. out.write("\t" + taggedSent.get(cursor).size()); for(Pair stg : taggedSent.get(cursor)) { out.write("\t" + stg.b + "\t" + stg.a); } out.write(System.getProperty("line.separator")); } out.write("" + System.getProperty("line.separator")); } out.flush(); if(test) { System.err.println(rs.report()); } } catch (IOException ex) { Logger.getLogger(WordAndPOSDictionaryLabellingStrategy.class.getName()).log(Level.SEVERE, null, ex); } finally { try { out.close(); in.close(); } catch (IOException ex) { Logger.getLogger(WordAndPOSDictionaryLabellingStrategy.class.getName()).log(Level.SEVERE, null, ex); } } } } // End class WordPOSDictLabellingStrategy ================================================ FILE: src/opennlp/ccg/parse/supertagger/io/XMLPOSDictionaryReader.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.supertagger.io; import java.io.File; import java.util.HashSet; import java.util.Collection; import java.util.Iterator; import java.util.Map; import java.util.TreeMap; import javax.xml.parsers.*; import opennlp.ccg.parse.supertagger.util.STTaggerPOSDictionary; import opennlp.ccg.util.Pair; import org.xml.sax.Attributes; import org.xml.sax.SAXException; import org.xml.sax.XMLReader; import org.xml.sax.helpers.DefaultHandler; /** * @author Dennis N. 
Mehay * @version $Revision: 1.2 $, $Date: 2009/12/21 02:10:57 $ */ public class XMLPOSDictionaryReader { private File dictFile; private XMLReader reader; private Map> dict; /** Creates a new instance of XMLDictionaryReader * @param dictFile A String pointing to the location of * the XML file specifying the word dictionary. */ public XMLPOSDictionaryReader(File df) { if(!df.exists()) { throw new RuntimeException("File "+df.getAbsolutePath().toString()+" does not exist."); } this.dictFile = df; } /** * Read in the dictionary file and create a new STTaggerPOSDictionary. * @return A new STTaggerPOSDictionary. */ public STTaggerPOSDictionary read() { SAXParserFactory factory = SAXParserFactory.newInstance(); try { SAXParser parser = factory.newSAXParser(); reader = parser.getXMLReader(); reader.setContentHandler(new wdContentHandler()); reader.parse(this.dictFile.toURI().toString()); } catch(Exception e) { e.printStackTrace(); } return new STTaggerPOSDictionary(this.dict); } public static void main(String[] args) { // This is just to verify that the XML doc read in is the one // spit out. String fname = args[0]; XMLPOSDictionaryReader rdr = new XMLPOSDictionaryReader(new File(fname)); STTaggerPOSDictionary dct = rdr.read(); Iterator>> it = dct.getMappings(); Pair> tempP = null; System.out.println(""); while(it.hasNext()) { tempP = it.next(); System.out.println(" "); for(Iterator stgs = tempP.b.iterator(); stgs.hasNext(); ) { System.out.println(" "+stgs.next().trim()+" "); } System.out.println(" "); } System.out.print(""); } /* * A ContentHandler to properly interpret the "semantics" of the XML (semantics * in the CS sense of formal semantics of a structured document). */ class wdContentHandler extends DefaultHandler { private boolean inEntry = false, inSupertag = false; private String curPOS = null, currSTFrag = null; @Override public void startDocument() { dict = new TreeMap>(); } @Override public void startElement(String namespaceURI, String lname, String qname, Attributes attrs) throws SAXException { if(qname.equalsIgnoreCase("entry")) { if(this.inEntry) { throw new SAXException("Something is wrong.\nThis is not a well-formed dictionary."); } else { this.inEntry = true; String pos = attrs.getValue(0).trim(); dict. put(pos, new HashSet()); this.curPOS = pos; } } else if(qname.equalsIgnoreCase("supertag")) { if(!this.inEntry) { throw new SAXException("Something is wrong.\nThis is not a well-formed dictionary."); } else { this.inSupertag = true; this.currSTFrag = ""; } } } @Override public void endElement(String uri, String name, String qName) { if(qName.equalsIgnoreCase("entry")) { this.inEntry = false; this.curPOS = null; } else if(qName.equalsIgnoreCase("supertag")) { this.inSupertag = false; Collection tempL = dict.get(this.curPOS); tempL.add(this.currSTFrag.trim()); dict.put(this.curPOS, tempL); this.currSTFrag = null; } } @Override public void characters(char[] ch, int start, int length) { if(this.inSupertag && this.curPOS!=null) { // Get this supertag and add it to the list mapped to by this POS (i.e., the list // of supertags seen with this POS in training). 
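// (SAX may deliver the text of a single supertag element in several chunks, which is why
// characters() appends to currSTFrag rather than assigning; endElement() trims and stores
// the accumulated string.)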
String temp = new String(ch); temp = temp.substring(start, start+length); this.currSTFrag += temp; } else if(this.inSupertag) { System.err.println("Something is wrong.\nThis is not a well-formed dictionary."); } } } } ================================================ FILE: src/opennlp/ccg/parse/supertagger/io/XMLWordDictionaryReader.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.supertagger.io; import java.io.File; import java.util.HashSet; import java.util.Iterator; import java.util.Map; import java.util.Collection; import java.util.TreeMap; import javax.xml.parsers.*; import opennlp.ccg.parse.supertagger.util.STTaggerWordDictionary; import opennlp.ccg.util.Pair; import org.xml.sax.Attributes; import org.xml.sax.SAXException; import org.xml.sax.XMLReader; import org.xml.sax.helpers.DefaultHandler; /** * @author Dennis N. Mehay * @version $Revision: 1.3 $, $Date: 2010/09/21 04:12:41 $ */ public class XMLWordDictionaryReader { private File dictFile; private XMLReader reader; private Map>> dict; /** Creates a new instance of XMLDictionaryReader * @param dictFile A String pointing to the location of * the XML file specifying the word dictionary. */ public XMLWordDictionaryReader(File df) { if(!df.exists()) { throw new RuntimeException("File "+df.getAbsolutePath().toString()+" does not exist."); } this.dictFile = df; } /** * Read in the dictionary file and create a new STTaggerWordDictionary. * @return A new STTaggerWordDictionary. */ public STTaggerWordDictionary read() { SAXParserFactory factory = SAXParserFactory.newInstance(); try { SAXParser parser = factory.newSAXParser(); reader = parser.getXMLReader(); reader.setContentHandler(new wdContentHandler()); reader.parse(this.dictFile.toURI().toString()); } catch(Exception e) { e.printStackTrace(); } return new STTaggerWordDictionary(this.dict); } public static void main(String[] args) { // This is just to verify that the XML doc read in is the one // spit out. String fname = args[0]; XMLWordDictionaryReader rdr = new XMLWordDictionaryReader(new File(fname)); STTaggerWordDictionary dct = rdr.read(); Iterator>>> it = dct.getMappings(); Pair>> tempP = null; System.out.println(""); while(it.hasNext()) { tempP = it.next(); System.out.println(" "); for(Iterator stgs = tempP.b.b.iterator(); stgs.hasNext(); ) { System.out.println(" "+stgs.next().trim()+" "); } System.out.println(" "); } System.out.print(""); } /* * A ContentHandler to properly interpret the "semantics" of the XML (semantics * in the CS sense of formal semantics of a structured document). 
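 *
 * The reader expects entry elements whose first attribute is the word form and whose second
 * is its training-data frequency, each containing one or more supertag child elements.
 * An illustrative entry (attribute names are a sketch only; the handler reads attributes
 * positionally):
 *
 *   <entry word="the" freq="12345">
 *     <supertag>np/n</supertag>
 *   </entry>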
*/ class wdContentHandler extends DefaultHandler { private boolean inEntry = false, inSupertag = false; private String curWord = null, currSTFrag = null; @Override public void startDocument() { dict = new TreeMap>>(); } @Override public void startElement(String namespaceURI, String lname, String qname, Attributes attrs) throws SAXException { if(qname.equalsIgnoreCase("entry")) { if(this.inEntry) { throw new SAXException("Something is wrong.\nThis is not a well-formed dictionary."); } else { this.inEntry = true; String word = attrs.getValue(0).trim(), freq = attrs.getValue(1).trim(); word = word.replace("&","&"); word = word.replace(">",">"); word = word.replace("<","<"); word = word.replace("'","\'"); word = word.replace(""","\""); dict. put(word, new Pair>( new Integer(Integer.parseInt(freq)), new HashSet())); this.curWord = word; } } else if(qname.equalsIgnoreCase("supertag")) { if(!this.inEntry) { throw new SAXException("Something is wrong.\nThis is not a well-formed dictionary."); } else { this.inSupertag = true; this.currSTFrag = ""; } } } @Override public void endElement(String uri, String lName, String qName) { if(qName.equalsIgnoreCase("entry")) { this.inEntry = false; this.curWord = null; } else if(qName.equalsIgnoreCase("supertag")) { this.inSupertag = false; Pair> tempL = dict.get(this.curWord); tempL.b.add(this.currSTFrag.trim()); dict.put(this.curWord, tempL); this.currSTFrag = null; } } @Override public void characters(char[] ch, int start, int length) { if(this.inSupertag && this.curWord!=null) { // Get this supertag and add it to the list mapped to by this word (i.e., the list // of supertags seen with this word in training). String temp = new String(ch); temp = temp.substring(start, start+length); this.currSTFrag += temp; } else if(this.inSupertag) { System.err.println("Something is wrong.\nThis is not a well-formed dictionary."); } } } } ================================================ FILE: src/opennlp/ccg/parse/supertagger/ml/FeatureExtractor.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.supertagger.ml; import opennlp.ccg.parse.tagger.TaggedWord; import java.util.Collection; import java.util.List; import java.util.Map; import opennlp.ccg.util.Pair; /** * @author Dennis N. Mehay * @version $Revision: 1.1 $, $Date: 2010/09/21 04:12:41 $ */ public interface FeatureExtractor { /** * @param sentence A {@code Map} giving the (string-indexed) sentence of * {@code Word}s to be tagged. * @param wordIndex An {@code Integer}, giving the string index of the current word. 
* @return A {@code Collection>} representing the * real-valued activations of features (predicates) in the context of a word to be labelled. */ public Collection> getFeatures(Map sentence, Integer wordIndex); /** * Same as getFeatures, but for the whole sentence, returning a List of contextual features, in order, one * per Word in sentence */ public List>> getSentenceFeatures(Map sentence); /** * @param sentence A Map giving the (string-indexed) sentence of * Words to be tagged. * @param wordIndex An Integer, giving the string index of the current word. * @param training A boolean indicating whether we are extracting features for training (in which case * we need the label too). * @return A Collection> representing the * real-valued activations of features (predicates) in the context of a word to be labelled. */ public Collection> getFeatures(Map sentence, Integer wordIndex, boolean training); /** * Same as getFeatures, but for the whole sentence, returning a List of contextual features, in order, one * per Word in sentence */ public List>> getSentenceFeatures(Map sentence, boolean training); } ================================================ FILE: src/opennlp/ccg/parse/supertagger/ml/STFex.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.supertagger.ml; import java.io.BufferedReader; import java.io.IOException; import java.io.InputStreamReader; import java.util.logging.Level; import java.util.logging.Logger; import opennlp.ccg.lexicon.Word; import opennlp.ccg.parse.tagger.TaggedWord; import opennlp.ccg.parse.tagger.Constants; import java.util.ArrayList; import java.util.Collection; import java.util.Collections; import java.util.HashMap; import java.util.List; import java.util.Map; import opennlp.ccg.parse.postagger.POSTagger; import opennlp.ccg.parse.tagger.io.SRILMFactoredBundleCorpusIterator; import opennlp.ccg.util.Pair; /** * @author Dennis N. 
Mehay * @version $Revision: 1.7 $, $Date: 2010/12/15 07:16:03 $ */ public class STFex implements FeatureExtractor { private boolean useMultiPOS = false; public static final String LEX = "X"; public static final String POS = "P"; public static final String prevP = POS + "-1="; public static final String prevPrevP = POS + "-2="; public static final String nextP = POS + "+1="; public static final String nextNextP = POS + "+2="; public static final String curP = POS + "="; public static final String prevL = LEX + "-1="; public static final String prevPrevL = LEX + "-2="; public static final String nextL = LEX + "+1="; public static final String nextNextL = LEX + "+2="; public static final String curL = LEX + "="; public static final String priorST = "PST" + "="; public static final String wordPOSPriorST = "WPosPST" + "="; public static final String wordPriorST = "WPST" + "="; public static final String POSPriorST = "PosPST" + "="; public static final String antiPriorST = "APST" + "="; public static final String wordPOSAntiPriorST = "WPosAPST" + "="; public static final String wordAntiPriorST = "WAPST" + "="; public static final String POSAntiPriorST = "PosAPST" + "="; public static final TaggedWord outOfBounds = Constants.OOB; private static final String[] lxfLabs = {LEX + "-2", LEX + "-1", LEX, LEX + "+1", LEX + "+2"}; private static final String[] posfLabs = {POS + "-2", POS + "-1", POS, POS + "+1", POS + "+2"}; /** * An object containing a ConditionalProbabilityTable that can give a prior distribution over all * known supertags given a POS-tagged word. * * Trained as a factored LM (presumably using SRILM). */ protected STPriorModel priorMod; /** Constructor with no prior model. */ public STFex( ) { this.priorMod = null; } /** Constructor with a prior model over supertags (to be used as a feature). */ public STFex(STPriorModel priorMod) { this.priorMod = priorMod; } /** Pass in true to use multi-POS features, pass in false not to. */ public void useMultiPOS(boolean trueOrFalse) { useMultiPOS = trueOrFalse; } /** * Extracts an ArrayList representing the contextual * predicates (features) of a line of (tokenised) text (each String * represents the predicates that fire for a word in the line). * Each resulting String will have the form: * cp1 cp2 ... cpK * @param sentence A List of feature bundles. * @param wordIndex An int giving the location of the word to be tagged. 
* @return A Collection> of real-valued feature activations * for the word at index wordIndex */ public Collection> getFeatures(Map sentence, Integer wordIndex, boolean training) { Collection> result = new ArrayList>(30); TaggedWord current, prev, prevPrev, next, nextNext; current = sentence.get(wordIndex); // -------- The left periphery ------------ int wind = wordIndex.intValue(); if (wind > 1) { prev = sentence.get(wind - 1); prevPrev = sentence.get(wind - 2); } else if (wind > 0) { prev = sentence.get(wind - 1); prevPrev = outOfBounds; } else { prev = prevPrev = outOfBounds; } // -------- The right periphery ----------- int tempSize = sentence.size(); if ((tempSize - (wind + 1)) >= 2) { next = sentence.get(wind + 1); nextNext = sentence.get(wind + 2); } else if (tempSize - (wind + 1) >= 1) { next = sentence.get(wind + 1); nextNext = outOfBounds; } else { next = nextNext = outOfBounds; } Double activation = new Double(1.0); if (training) result.add(new Pair(current.getSupertag(), activation)); result.add(new Pair(curL + current.getForm(), activation)); if(useMultiPOS) { for(Pair tg : current.getPOSTagging()) result.add(new Pair(curP + tg.b, tg.a)); } else { result.add(new Pair(curP + current.getPOS(), activation)); } result.add(new Pair(prevL + prev.getForm(), activation)); if(useMultiPOS && prev != Constants.OOB) { for(Pair tg : prev.getPOSTagging()) result.add(new Pair(prevP + tg.b, tg.a)); } else { result.add(new Pair(prevP + prev.getPOS(), activation)); } result.add(new Pair(prevPrevL + prevPrev.getForm(), activation)); if(useMultiPOS && prevPrev != Constants.OOB) { for(Pair tg : prevPrev.getPOSTagging()) result.add(new Pair(prevPrevP + tg.b, tg.a)); } else { result.add(new Pair(prevPrevP + prevPrev.getPOS(), activation)); } result.add(new Pair(nextL + next.getForm(), activation)); if(useMultiPOS && next != Constants.OOB) { for(Pair tg : next.getPOSTagging()) result.add(new Pair(nextP + tg.b, tg.a)); } else { result.add(new Pair(nextP + next.getPOS(), activation)); } result.add(new Pair(nextNextL + nextNext.getForm(), activation)); if(useMultiPOS && nextNext != Constants.OOB) { for(Pair tg : nextNext.getPOSTagging()) result.add(new Pair(nextNextP + tg.b, tg.a)); } else { result.add(new Pair(nextNextP + nextNext.getPOS(), activation)); } // now for conjunctions of features: w-2w-1=..., w-1w+1=..., w+1w+2=... (same for posp). // (i.e., bigram features over words and parts of speech and bigrams of words and POSs that straddle the current token). // N.B. only use single-best POSs (maybe change later). TaggedWord[] wds = {prevPrev, prev, current, next, nextNext}; for (int j = 1; j < wds.length; j++) { // add bigram features (only for single-best POS). result.add(new Pair(lxfLabs[j - 1] + "|" + lxfLabs[j] + "=" + wds[j - 1].getForm() + "|" + wds[j].getForm(), activation)); result.add(new Pair(posfLabs[j - 1] + "|" + posfLabs[j] + "=" + wds[j - 1].getPOS() + "|" + wds[j].getPOS(), activation)); // also, if at the current word slot, add bigrams that straddle the current word. if (j == 2) { result.add(new Pair(lxfLabs[j - 1] + "|" + lxfLabs[j + 1] + "=" + wds[j - 1].getForm() + "|" + wds[j + 1].getForm(), activation)); result.add(new Pair(posfLabs[j - 1] + "|" + posfLabs[j + 1] + "=" + wds[j - 1].getPOS() + "|" + wds[j + 1].getPOS(), activation)); } } // If the prior model is not null, extract a feature for the beta-best (beta = 0.1) classes // predicted by the prior model (for all output classes -- supertags -- seen with this word's // POS). // Extract prior features from these. 
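// Unlike the binary window features above (activation 1.0), these prior features carry the
// log-probability of each beta-best supertag as their activation, conjoined variously with the
// current word form and POS; an "anti-prior" feature with activation log(1 - p) is also added
// for each such supertag.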
if(priorMod != null) { priorMod.computePriors(current.getWord()); for(Pair priorClassActivationPair : priorMod.getRestrictedBetaBestPriors(current.getWord(), 0.1)) { // TODO: make beta parameterizable. double act = Math.log(priorClassActivationPair.b); String wd = current.getForm().intern(), pos = current.getPOS().intern(); result.add(new Pair(priorST + priorClassActivationPair.a.intern(), act)); // log(prob) result.add(new Pair(wordPriorST + priorClassActivationPair.a.intern()+"_"+wd, act)); // log(prob) result.add(new Pair(wordPOSPriorST + priorClassActivationPair.a.intern()+"_"+wd+"_"+pos, act)); // log(prob) result.add(new Pair(POSPriorST + priorClassActivationPair.a.intern()+"_"+pos, act)); // log(prob) result.add(new Pair(antiPriorST + priorClassActivationPair.a.intern(), Math.log(1-Math.exp(act)))); // log(1-prob) // TODO: come up with sensible "anti-prior" features that simulate the filtering effect of the tagging dict. } } return result; } public List>> getSentenceFeatures(Map sentence, boolean training) { List>> res = new ArrayList>>(sentence.size()); List keys = new ArrayList(sentence.keySet().size()); for(Integer i : sentence.keySet()) { keys.add(i); } Collections.sort(keys); for(Integer wordIndex : keys) { res.add(getFeatures(sentence, wordIndex, training)); } return res; } public Collection> getFeatures(Map sentence, Integer wordIndex) { return getFeatures(sentence, wordIndex, false); } public List>> getSentenceFeatures(Map sentence) { return getSentenceFeatures(sentence, false); } // main method for extracting features from a file (for training). // pass in a supertag prior model and prior model vocab file, if desired. // (these replace tagging dictionaries). // pass in a POS tagger config file, if we aren't only using gold POS tags only. // input corpus is from stdin, output goes to stdout. public static void main(String[] args) { // we assume that the training data is being streamed in from stdin (no parse IDs, just SRILM factor bundle lines), // and that output will stream to stdout. String usage = "\n | STFex (-h [gets this message]) (-r -v ) (-p ) | "; if(args.length > 0 && args[0].equals("-h")) { System.out.println(usage); System.exit(0); } String priorModF = null, priorVocab = null, posConfig = null; for(int j = 0; j < args.length; j++) { if(args[j].equals("-r")) { priorModF = args[++j]; continue; } if(args[j].equals("-v")) { priorVocab = args[++j]; continue; } if(args[j].equals("-p")) { posConfig = args[++j]; continue; } System.err.println("Unrecognized option: " + args[j]); } SRILMFactoredBundleCorpusIterator corp = new SRILMFactoredBundleCorpusIterator(new BufferedReader(new InputStreamReader(System.in))); STPriorModel stPriorMod = null; if(priorModF != null) { try { stPriorMod = new STPriorModel(priorModF, priorVocab); } catch (IOException ex) { Logger.getLogger(STFex.class.getName()).log(Level.SEVERE, null, ex); } } STFex fexer = new STFex(stPriorMod); POSTagger posT = (posConfig == null) ? null : POSTagger.posTaggerFactory(posConfig); if(posT != null) { fexer.useMultiPOS(true); } else { fexer.useMultiPOS(false); } for(List sentence : corp) { Map sent = new HashMap(sentence.size()); int index = 0; if(posT == null) { for(Word w : sentence) { sent.put(index++, new TaggedWord(w)); } } else { List posTagging = posT.tagSentence(sentence); for(TaggedWord tw : posTagging) { sent.put(index++, tw); } } List>> ftss = fexer.getSentenceFeatures(sent, true); for(Collection> fts : ftss) { index = 0; for(Pair ft : fts) { // if we're at the first item, print out the label. 
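// Each word becomes one training event on its own line: the gold supertag label first, then
// space-separated feature:activation pairs (the same format that
// ZhangLeTrainingExtractor.writeFeats() produces).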
if (index == 0) { System.out.print(ft.a); } else { System.out.print(" " + ft.a + ":" + ft.b); } index++; } System.out.println(); } } } } ================================================ FILE: src/opennlp/ccg/parse/supertagger/ml/STPriorModel.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2010 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.supertagger.ml; import opennlp.ccg.parse.supertagger.util.ProbPairComparator; import java.io.BufferedReader; import java.io.BufferedWriter; import java.io.File; import java.io.FileNotFoundException; import java.io.FileReader; import java.io.FileWriter; import java.io.IOException; import java.io.InputStreamReader; import java.io.OutputStreamWriter; import java.util.ArrayList; import java.util.Arrays; import java.util.Collection; import java.util.Collections; import java.util.HashMap; import java.util.HashSet; import java.util.List; import java.util.Map; import java.util.logging.Level; import java.util.logging.Logger; import opennlp.ccg.lexicon.DefaultTokenizer; import opennlp.ccg.lexicon.Word; import opennlp.ccg.ngrams.ConditionalProbabilityTable; import opennlp.ccg.parse.tagger.io.SRILMFactoredBundleCorpusIterator; import opennlp.ccg.parse.tagger.ProbIndexPair; import opennlp.ccg.parse.supertagger.util.STTaggerPOSDictionary; import opennlp.ccg.util.Interner; import opennlp.ccg.util.Pair; /** * (c) (2009) Dennis N. Mehay * @author Dennis N. Mehay * * Model for predicting p(supertag | word, pos). Uses an ARPA-formatted * SRILM-trained "unigram" factored LM for this, where each "unigram" is * a bundle of word:pos:supertag. */ public class STPriorModel extends ConditionalProbabilityTable { public static final String WORD = DefaultTokenizer.WORD_ATTR; public static final String POS_TAG = DefaultTokenizer.POS_ATTR; public static final String SUPERTAG = DefaultTokenizer.SUPERTAG_ATTR; private Interner> pairs = new Interner>(); /** * Re-usable list for attr-val pairs of word-pos-supertag inputs to the prior model * (i.e., for predicting p(STag | word, POS). */ public List> attrVals = new ArrayList>(5); /** * A comparator for sorting Pair's where the Double is a probability * (effectively sorts by descending order of probability). */ private ProbPairComparator ppcomp = new ProbPairComparator(); /** All the priors. Reference them when getting beta-best, beta-worst, etc. */ List> priors = new ArrayList>(1000); /** String[] of all possible supertag outcomes. */ private String[] stagVocab = null; /** double[] containing the probability distro over all supertags. 
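 * (Filled in and re-used across calls to getNBestPriors(), like stagPointers below, so a single
 * STPriorModel instance should not be shared across threads.)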
*/ private double[] stagDistro = null; /** * POS-keyed tagging dictionary (to provide restrictions on what the prior model may consider. * No restrictions if null. */ private STTaggerPOSDictionary posDict = null; /** * Re-usable way of containing the probabilities and a pointer back into where they came from * in the probability distro over all supertags. */ private ProbIndexPair[] stagPointers = null; /** Construct a prior model with the FLM config file and corresponding vocab file. */ public STPriorModel(String flmFile, String vocabFile) throws IOException { // create with a null POS dictionary (i.e., no restrictions on taggings). this(flmFile, vocabFile, null); } /** Construct a prior model with the FLM config file and corresponding vocab file. */ public STPriorModel(String flmFile, String vocabFile, STTaggerPOSDictionary posDict) throws IOException { super(flmFile); this.posDict = posDict; String st = null; BufferedReader br = new BufferedReader(new FileReader(new File(vocabFile))); st = br.readLine().trim(); // get next supertag from the vocab. while ((st != null) && !st.trim().startsWith(SUPERTAG + "-")) { st = br.readLine(); } if (st != null) { st = st.trim().split("-")[1]; } Collection allSupertags = new HashSet(); // find out how many outcomes we have. int cnt = 0; while (st != null) { cnt++; allSupertags.add(st); while ((st != null) && !st.trim().startsWith(SUPERTAG + "-")) { st = br.readLine(); } if (st != null) { st = st.trim().split("-")[1]; } } br.close(); // initialize the arrays to this size. stagVocab = new String[cnt]; stagPointers = new ProbIndexPair[cnt]; stagDistro = new double[cnt]; cnt = 0; // fill the vocab array with all possible supertags. for (String stag : allSupertags) { stagVocab[cnt++] = stag.intern(); } } /** Set the POS-keyed tagging dictionary. */ public void setPOSDict(STTaggerPOSDictionary posDict) { this.posDict = posDict; } /** Get the prior probability of this supertag/POS/word combo. */ public double getPriorOf(String supertag, String word, String pos) { attrVals.clear(); Pair surfaceForm = pairs.intern(new Pair(WORD, DefaultTokenizer.escape(word).intern())); attrVals.add(surfaceForm); Pair partOfSpeech = pairs.intern(new Pair(POS_TAG, DefaultTokenizer.escape(pos).intern())); attrVals.add(partOfSpeech); attrVals.add(pairs.intern(new Pair(SUPERTAG, DefaultTokenizer.escape(supertag).intern()))); return score(attrVals); } /** Get the beta-best tags for this word, under the prior model. */ public List> getBetaBestPriors(Word w, double beta) { List> allPriors = getAllPriors(w); List> betaBestPriors = new ArrayList>(100); double best = allPriors.get(0).b; for (Pair prior : allPriors) { if (best * beta <= prior.b) { betaBestPriors.add(prior); } else { break; } } return betaBestPriors; } /** Compute all priors, subject to the POS dict constraints. */ public void computePriors(Word w) { if (posDict != null) { priors = getPOSRestrictedPriors(w); } } /** Get the POS-dict restricted prior distribution (sorted descending by prob.) */ protected List> getPOSRestrictedPriors(Word w) { Collection tagsAllowed = posDict.getEntry(w.getPOS()); if (tagsAllowed == null || tagsAllowed.size() == 0) { return priors; } else { List> sortedTags = new ArrayList>(tagsAllowed.size()); for (String tag : tagsAllowed) { sortedTags.add(new Pair(getPriorOf(tag, w.getForm(), w.getPOS()), tag)); } Collections.sort(sortedTags, ppcomp); return sortedTags; } } /** * Get the beta-best tags (using the prior model) only from among the POS-dictionary-allowed possibilities. 
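 * When a POS-keyed tagging dictionary has been set, computePriors(Word) must be called first
 * so that the cached, POS-restricted prior distribution for this word is up to date.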
* beta-best (def'n): {t | p(t) >= beta * p(best-tag) } */ public List> getRestrictedBetaBestPriors(Word w, double beta) { if (posDict == null) { return getBetaBestPriors(w, beta); } else { List> rez = new ArrayList>(50); double best = priors.get(0).a; for(Pair tg : priors) { if(tg.a >= (beta * best)) { rez.add(new Pair(tg.b,tg.a)); } else { break; } } return rez; } } /** * Get the beta-WORST tags (using the prior model) only from among the POS-dictionary-allowed possibilities. * beta-best (def'n): {t | p(t) >= beta * p(best-tag) } * beta-worst (def'n): {t | p(t) * beta <= p(worst-tag)} */ public List> getRestrictedBetaWorstPriors(Word w, double beta) { if (posDict == null) { throw new UnsupportedOperationException("Cannot get beta-worst without a pos-keyed tagging dict.\nNot yet implemented."); } else { List> rez = new ArrayList>(50); List> cpy = new ArrayList>(priors); Collections.reverse(cpy); double worst = cpy.get(0).a; for(Pair tg : cpy) { if((tg.a * beta) <= worst) { rez.add(new Pair(tg.b,tg.a)); } else { break; } } return rez; } } public List> getAllPriors(Word w) { return getNBestPriors(w, stagVocab.length); } /** Get the n-best supertags on the prior model, given this word (with POS). */ public List> getNBestPriors(Word w, int n) { attrVals.clear(); Pair surfaceForm = pairs.intern(new Pair(WORD, DefaultTokenizer.escape(w.getForm()).intern())); attrVals.add(surfaceForm); Pair pos = pairs.intern(new Pair(POS_TAG, DefaultTokenizer.escape(w.getPOS()).intern())); attrVals.add(pos); int cnt = 0; for (String st : stagVocab) { // remove the last stag factor, if there. if (attrVals.size() == 3) { attrVals.remove(attrVals.size() - 1); } attrVals.add(pairs.intern(new Pair(SUPERTAG, st))); // add the probability of this tag under the prior model to the distro array. double sc = score(attrVals); stagDistro[cnt] = sc; // add this probability with a pointer back to where it came from in the vocab. // (so that we can sort by probability, but then retrieve the supertag string). stagPointers[cnt] = new ProbIndexPair(sc, cnt); cnt++; } // sort descending by probability (achieved by the comparator implementation of ProbIndexPair). Arrays.sort(stagPointers); List> result = new ArrayList>(n); for (int i = 0; i < n; i++) { result.add(new Pair(stagVocab[stagPointers[i].b], stagPointers[i].a)); } return result; } public static void main(String[] args) throws IOException { String usage = "\nSTPriorModel -vocab (-c ) (-o ) (-u ) (-v [ or '-verbose'])\n"; if (args.length > 0 && args[0].equals("-h")) { System.out.println(usage); System.exit(0); } SRILMFactoredBundleCorpusIterator in = null; BufferedWriter out = null; BufferedWriter voc = null; try { String inputCorp = "", output = "", vocabFile = "vocab.voc"; int catCutoff = 10; for (int i = 0; i < args.length; i++) { if (args[i].equals("-c")) { inputCorp = args[++i]; continue; } if (args[i].equals("-o")) { output = args[++i]; continue; } if (args[i].equals("-vocab")) {vocabFile = args[++i]; continue; } if (args[i].equals("-u")) { catCutoff = Integer.parseInt(args[++i]); continue; } System.out.println("Unrecognized option: " + args[i]); } try { in = new SRILMFactoredBundleCorpusIterator( (inputCorp.equals("")) ? new BufferedReader(new InputStreamReader(System.in)) : new BufferedReader(new FileReader(new File(inputCorp)))); } catch (FileNotFoundException ex) { System.err.print("Input corpus " + inputCorp + " not found. Exiting..."); Logger.getLogger(STPriorModel.class.getName()).log(Level.SEVERE, null, ex); System.exit( -1); } try { out = (output.equals("")) ? 
new BufferedWriter(new OutputStreamWriter(System.out)) : new BufferedWriter(new FileWriter(new File(output))); } catch (IOException ex) { System.err.print("Output file " + output + " not found. Exiting..."); Logger.getLogger(STPriorModel.class.getName()).log(Level.SEVERE, null, ex); System.exit( -1); } try { voc = new BufferedWriter(new FileWriter(new File(vocabFile))); } catch (IOException ex) { Logger.getLogger(STPriorModel.class.getName()).log(Level.SEVERE, null, ex); } Map vocab = new HashMap(); for (List inLine : in) { for (Word w : inLine) { String st = SUPERTAG + "-" + DefaultTokenizer.escape(w.getSupertag()), pos = POS_TAG + "-" + DefaultTokenizer.escape(w.getPOS()), wform = WORD + "-" + DefaultTokenizer.escape(w.getForm()); vocab.put(st, (vocab.get(st) == null) ? 1 : vocab.get(st) + 1); vocab.put(pos, (vocab.get(pos) == null) ? 1 : vocab.get(pos) + 1); vocab.put(wform, (vocab.get(wform) == null) ? 1 : vocab.get(wform) + 1); } } // reopen file try { in = new SRILMFactoredBundleCorpusIterator( (inputCorp.equals("")) ? new BufferedReader(new InputStreamReader(System.in)) : new BufferedReader(new FileReader(new File(inputCorp)))); } catch (FileNotFoundException ex) { System.err.print("Input corpus " + inputCorp + " not found. Exiting..."); Logger.getLogger(STPriorModel.class.getName()).log(Level.SEVERE, null, ex); System.exit( -1); } for (List inLine : in) { for (Word w : inLine) { String st = SUPERTAG + "-" + DefaultTokenizer.escape(w.getSupertag()), pos = POS_TAG + "-" + DefaultTokenizer.escape(w.getPOS()), wform = WORD + "-" + DefaultTokenizer.escape(w.getForm()); if (vocab.get(st) > catCutoff) { out.write(wform + ":" + pos + ":" + st + " "); } } out.write(System.getProperty("line.separator")); } out.flush(); for (String str : vocab.keySet()) { if (vocab.get(str) > catCutoff) { voc.write(str + System.getProperty("line.separator")); } } voc.flush(); } finally { try { out.close(); in.close(); voc.close(); } catch (IOException ex) { Logger.getLogger(STPriorModel.class.getName()).log(Level.SEVERE, null, ex); } } } } ================================================ FILE: src/opennlp/ccg/parse/supertagger/ml/ZhangLeTrainingExtractor.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.supertagger.ml; import java.io.BufferedReader; import java.io.BufferedWriter; import java.io.File; import java.io.FileNotFoundException; import java.io.FileReader; import java.io.FileWriter; import java.io.IOException; import java.util.Collection; import java.util.Iterator; import java.util.List; import java.util.Map; import java.util.TreeMap; import java.util.logging.Level; import java.util.logging.Logger; import opennlp.ccg.lexicon.Word; import opennlp.ccg.parse.tagger.io.PipeDelimitedFactoredBundleCorpusIterator; import opennlp.ccg.parse.tagger.io.SRILMFactoredBundleCorpusIterator; import opennlp.ccg.parse.supertagger.ml.FeatureExtractor; import opennlp.ccg.parse.supertagger.ml.STFex; import opennlp.ccg.parse.tagger.TaggedWord; import opennlp.ccg.util.Pair; /** * @author Dennis N. Mehay * @version $Revision: 1.3 $, $Date: 2010/09/21 04:12:41 $ */ public class ZhangLeTrainingExtractor { private File outputF; private Iterator> incorp; private FeatureExtractor fexer = new STFex(); /** * Create a training feature extractor that will extract features (with results) * for every instance in the input (training) corpus corpusName. * * @param corpusName A String giving the complete * path to the input file of SRILM-compliant factored bundles. * @param outputFileName A String giving the complete * path to the output file where the features will be written. */ public ZhangLeTrainingExtractor(File corpus, File outputF, String tokenisation) { this(corpus, outputF, tokenisation, new STFex()); } public ZhangLeTrainingExtractor(File corpus, File outputF, String tokenisation, FeatureExtractor fexer) { this.fexer = fexer; this.outputF = outputF; try { if (tokenisation.equalsIgnoreCase("srilm")) { incorp = new SRILMFactoredBundleCorpusIterator(new BufferedReader(new FileReader(corpus))); } else { incorp = new PipeDelimitedFactoredBundleCorpusIterator(new BufferedReader(new FileReader(corpus))); } } catch (FileNotFoundException ex) { Logger.getLogger(ZhangLeTrainingExtractor.class.getName()).log(Level.SEVERE, null, ex); } } /** * Writes training feats to file. */ public void writeFeats() { BufferedWriter bw = null; try { try { bw = new BufferedWriter(new FileWriter(this.outputF)); } catch (IOException ex) { Logger.getLogger(ZhangLeTrainingExtractor.class.getName()).log(Level.SEVERE, null, ex); } if (bw != null || this.incorp != null) { List sent = null; Map snt = null; Iterator> sents = this.incorp; while (sents.hasNext()) { //for (Iterator> sents = this.incorp; sents.hasNext();) { sent = sents.next(); // turn the sent into a map from integer string indices to Words. 
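// Each Word is wrapped as a TaggedWord so the STFex feature extractor can be applied to
// gold-annotated training data, with the word's gold POS serving as its POS tagging.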
int index = 0; snt = new TreeMap(); for (Word w : sent) { snt.put(index++, new TaggedWord(w)); } // 'true' says "we're getting training feats" for (Collection> sentFeatsWithActivation : fexer.getSentenceFeatures(snt, true)) { try { boolean isLabel = true; for (Pair ftWAct : sentFeatsWithActivation) { if (isLabel) { bw.write(ftWAct.a + " "); isLabel = false; } else { bw.write(ftWAct.a + ":" + ftWAct.b.doubleValue() + " "); } } bw.newLine(); } catch (IOException ex) { Logger.getLogger(ZhangLeTrainingExtractor.class.getName()).log(Level.SEVERE, null, ex); } } } } } finally { try { bw.flush(); bw.close(); } catch (IOException ex) { Logger.getLogger(ZhangLeTrainingExtractor.class.getName()).log(Level.SEVERE, null, ex); } catch (Exception e) { System.out.println(e); } } } } ================================================ FILE: src/opennlp/ccg/parse/supertagger/util/PipedTokenizer.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.supertagger.util; import java.util.List; import opennlp.ccg.lexicon.DefaultTokenizer; import opennlp.ccg.lexicon.Word; import opennlp.ccg.util.Pair; /** * @author Dennis N. Mehay * @version $Revision: 1.1 $, $Date: 2009/08/21 17:20:20 $ */ public class PipedTokenizer extends DefaultTokenizer { public PipedTokenizer() { super(); } @Override public Word parseToken(String token, boolean strictFactors) { // init String form = token; String stem = null; String POS = null; String pitchAccent = null; String supertag = null; String semClass = null; List> attrValPairs = null; // handle pipe-separated attr-val pairs int pipePos = token.indexOf('|'); String suffix = null; if (pipePos > 0) { // get word form form = token.substring(0, pipePos); // shave off word form suffix = token.substring(pipePos + 1); // get next | position pipePos = suffix.indexOf('|'); // get stem [or lemma]. could be null. stem = suffix.substring(0,pipePos); if (stem.equals("")) { stem = null;} // shave off stem/lemma suffix = suffix.substring(pipePos + 1); // get next | position pipePos = suffix.indexOf('|'); // get POS POS = suffix.substring(0,pipePos); // shave off POS suffix = suffix.substring(pipePos + 1); // see whether there is a supertag if (suffix != null && !suffix.equals("")) { // get supertag supertag = suffix.trim(); } } else { throw new RuntimeException("This file is not in the right format: \n"+ "form|lemma|POS|(Supertag) ... 
form|lemma|POS(Supertag)."); } // done return Word.createWord(form, pitchAccent, attrValPairs, stem, POS, supertag, semClass); } } ================================================ FILE: src/opennlp/ccg/parse/supertagger/util/ProbPairComparator.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (c) 2010 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed inp the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.supertagger.util; import java.util.Comparator; import opennlp.ccg.util.Pair; /** * @author Dennis N. Mehay * * A little Comparator instance for comparing Pair * instances of pair by descending order of the Double value (assuming * that they are probabilities of string tags). */ public class ProbPairComparator implements Comparator> { /** * Implements the Comparator interface's work-horse method. * * Compares two Pair objects. Crucially, it does NOT * ensure that both objects are Pair before casting them. * The caller is responsible for ensuring this, and failure to do so may * result in a RuntimeException. */ public int compare(Pair pr1, Pair pr2) { if (pr1 == pr2) { return 0; } return -1 * Double.compare(pr1.a, pr2.a); } } ================================================ FILE: src/opennlp/ccg/parse/supertagger/util/STTaggerDictionary.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.supertagger.util; //import java.util.ArrayList; import java.util.Collection; /** * An interface for supertagger "dictionaries" as described * in, e.g., Clark (2002) _Supertagging for CCG_. * * @author Dennis N. Mehay * @version $Revision: 1.1 $, $Date: 2009/08/21 17:20:20 $ */ public interface STTaggerDictionary { /** * A method for getting the dictionary entry for a particular * String key. 
* The key will usually be a word, lemma or a part * of speech, but you may have other interesting grammatical things * to associate with supertags. * * @param key A String representing a particular * grammatical type. * @return A Collection containing supertags (CCG lexical * categories) seen with the particular grammatical type `key'. * Returns null if that word was not seen in the * corpus or (if the implementing class has a frequency cut-off) * if that type's token frequency was not high enough. */ public Collection getEntry(String key); /** * A method to test whether this STTaggerDictionary contains * an entry for a particular String key. * The key will usually be a word, lemma or a part of speech, but * you may have other interesting grammatical things to associate with * supertags. * * @param key A String representing a particular * grammatical type. * @return A boolean value of true or * false answering the question of whether this * dictionary contains an entry for the specified key. */ public boolean containsEntry(String key); } ================================================ FILE: src/opennlp/ccg/parse/supertagger/util/STTaggerPOSDictionary.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.supertagger.util; //import util.Pair; import java.io.*; import java.util.ArrayList; import java.util.Collection; import java.util.Iterator; import java.util.Map; import opennlp.ccg.util.Pair; /** * @author Dennis N. Mehay * @version $Revision: 1.2 $, $Date: 2010/09/21 04:12:41 $ */ public class STTaggerPOSDictionary implements STTaggerDictionary, Serializable { private static final long serialVersionUID = -4814356608876054823L; /** * This object represents our dictionary. The String is the * POS we want to look up, and the Collection holds all of * of the CCG lex. cat's seen with that POS. */ private Map> dict = null; /** * This constructor does not create the dictionary; that must * be done using a DictionaryMaker. */ public STTaggerPOSDictionary(Map> dict) { this.dict = dict; } /** * This method implements the interface STTaggerDictionary * by delegating to getEntry(String, int) (see below). */ public Collection getEntry(String POS) { return this.dict.get(POS); } /** * A method that returns the contents of the mapping embodied in this dictionary. * @return An Iterator of supertagger.util.Pairs * that represent the pos -> { ... supertags ...} mappings in the dictionary. 
*/ public Iterator>> getMappings() { Iterator keyset = this.dict.keySet().iterator(); ArrayList>> preRes = new ArrayList>>(); String tempS = null; while(keyset.hasNext()) { tempS = keyset.next(); preRes.add(new Pair>(tempS, this.dict.get(tempS))); } return preRes.iterator(); } /** * A method to test whether this STTaggerDictionary contains * an entry for a particular String representing a POS tag. * * @param key A String representing a particular * POS tag. * @return A boolean value of true or * false answering the question of whether this * dictionary contains an entry for the specified POS tag. */ public boolean containsEntry(String POS) { return this.dict.containsKey(POS); } } // End class STTaggerPOSDictionary ================================================ FILE: src/opennlp/ccg/parse/supertagger/util/STTaggerWordDictionary.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.supertagger.util; import java.io.*; import java.util.ArrayList; import java.util.Collection; import java.util.Iterator; import java.util.Map; import opennlp.ccg.util.Pair; /** * @author Dennis N. Mehay * @version $Revision: 1.2 $, $Date: 2009/11/15 04:52:26 $ */ public class STTaggerWordDictionary implements STTaggerDictionary, Serializable { private static final long serialVersionUID = -2474606825228545547L; /* This object represents our dictionary. The String is the * word we want to look up, and the Pair holds * the word frequency count (= `a') and the Collection of the CCG lex. cat's * seen with that word (= `b'). */ private Map>> dict = null; /* This constructor does not create the dictionary; that must * be done using a DictionaryMaker. */ public STTaggerWordDictionary(Map>> dict) { this.dict = dict; } /** * This method implements the interface STTaggerDictionary * by delegating to getEntry(String, int) (see below). */ public Collection getEntry(String word) { return getEntry(word, 1); } /** * A method for getting the dictionary entry for a particular * String word, only if that word appears at least * `freq' times in the corpus. * * @param key A String representing a particular * word. * @param freq An int specifying the number of times a * word should have occured before it is returned. * @return A String[] containing all supertags (CCG lexical * categories) seen with the specified word. * Returns null if the word does not appear at least * `freq' times in the corpus from which the dictionary was * created or if the word does not appear at all. * (N.B. Passing in an int `freq' value of zero will elicit the * same behavior as passing in a `freq' value of 1.) 
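     * (For illustration: given a hypothetical entry mapping "bank" to the pair
     * (3, { n, n/n }), getEntry("bank", 2) returns { n, n/n }, while
     * getEntry("bank", 5) returns null, since the word was only seen 3 times.)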
*/ @SuppressWarnings("unchecked") public Collection getEntry(String word, int freq) { if (word == null) return null; // mww: extra null check Object o = this.dict.get(word); if(o==null) { return null; } Pair> p = (Pair>)o; int wfreq = p.a.intValue(); if(wfreq>=freq) { return p.b; } else { return null; } } // End method getEntry(String, int) /** * A method to test whether this STTaggerDictionary contains * an entry for a particular String representing a word. * * @param key A String representing a particular * word. * @return A boolean value of true or * false answering the question of whether this * dictionary contains an entry for the specified word. */ public boolean containsEntry(String word) { return this.dict.containsKey(word); } /** * A method that returns the contents of the mapping embodied in this dictionary. * @return An Iterator of supertagger.util.Pairs * that represent the word -> (freq, { ... supertags ...}) mappings in the dictionary. */ public Iterator>>> getMappings() { Iterator keyset = this.dict.keySet().iterator(); ArrayList>>> preRes = new ArrayList>>>(); String tempS = null; while(keyset.hasNext()) { tempS = keyset.next(); preRes.add( new Pair>>(tempS, this.dict.get(tempS))); } return preRes.iterator(); } /** * A method for getting the number of times a word was seen * in the training data with which this dictionary was created. * * @param word A String representing the word in question. * @return An int count of this word's frequency in the * corpus with which this dictionary was created. */ @SuppressWarnings("unchecked") public int getCount(String word) { Object o = dict.get(word); if(o==null) { return 0; } else { Pair> p = (Pair>)o; return p.a.intValue(); } } // End method getCount(word) } // End class STTaggerWordDictionary ================================================ FILE: src/opennlp/ccg/parse/supertagger/util/SupertagSequenceGetter.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (c) 2010 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed inp the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.supertagger.util; import java.io.BufferedReader; import java.io.BufferedWriter; import java.io.File; import java.io.FileNotFoundException; import java.io.FileReader; import java.io.FileWriter; import java.io.IOException; import java.util.List; import opennlp.ccg.lexicon.Word; import opennlp.ccg.parse.tagger.io.SRILMFactoredBundleCorpusIterator; /** * @author Dennis N. 
Mehay */ public class SupertagSequenceGetter { public static void main(String[] args) throws FileNotFoundException, IOException { String usage = "\nSupertagSequenceGetter -i -o \n"; String input = null, output = null; if(args == null || args.length == 0 || args[0].equals("-h")) { System.err.println(usage); System.exit(0); } for(int i = 0; i < args.length; i++) { if(args[i].equals("-i")) { input = args[++i]; continue; } if(args[i].equals("-o")) { output = args[++i]; continue; } System.err.println("unknown command-line option: " + args[i]); } BufferedReader in = new BufferedReader(new FileReader(new File(input))); SRILMFactoredBundleCorpusIterator corp = new SRILMFactoredBundleCorpusIterator(in); BufferedWriter out = new BufferedWriter(new FileWriter(new File(output))); for(List sent : corp) { out.write(" "); for(Word w : sent) { out.write(w.getSupertag()+" "); } out.write(""+System.getProperty("line.separator")); } out.close(); } } ================================================ FILE: src/opennlp/ccg/parse/supertagger/util/TaggingDictionaryExtractor.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.supertagger.util; import java.io.BufferedReader; import java.io.BufferedWriter; import java.io.File; import java.io.FileNotFoundException; import java.io.FileReader; import java.io.FileWriter; import java.io.IOException; import java.text.CharacterIterator; import java.text.StringCharacterIterator; import java.util.HashMap; import java.util.HashSet; import java.util.Iterator; import java.util.List; import java.util.Map; import java.util.Set; import java.util.logging.Level; import java.util.logging.Logger; import opennlp.ccg.lexicon.Word; import opennlp.ccg.parse.tagger.io.PipeDelimitedFactoredBundleCorpusIterator; import opennlp.ccg.parse.tagger.io.SRILMFactoredBundleCorpusIterator; import opennlp.ccg.util.Pair; /** * Extracts and writes out XML files containing tagging * dictionary stats. * * @author Dennis N. Mehay * @version $Revision: 1.5 $, $Date: 2010/09/21 04:12:41 $ */ public class TaggingDictionaryExtractor { /** * Create a new dictionary extractor, specifying the word and POS * dictionary files, as well as the tokenisation type (SRILM Factored bundle or * C&C/Moses-style pipe-delimited factored bundles. * @param corpus A File of plain-text, one sentence per line and no additional mark-up beyond * the ... for SRILM factored bundle style. * @param wd A File where the word-based tagging dictionary will be written. * @param posd A File where the POS-based tagging dictionary will be written. 
* @param tokenisationType A String telling us how to tokenise factors in the * corpus file. */ // mapping from words to a pairing of their frequencies and the lexical categories they were seen with. private Map>> wdmap = new HashMap>>(); // mapping from POS tags to the lexical categories they were seen with. private Map> posmap = new HashMap>(); private Iterator> incorp = null; // writers for dict files. private BufferedWriter wbr = null, pbr = null; // how frequently a cat must occur to make it into the dictionaries. private int minCatFreq = 1; /** * Escape characters for text appearing as XML data, between tags. * *

 * The following characters are replaced with corresponding character entities:
 *
 *     Character   Encoding
 *     <           &lt;
 *     >           &gt;
 *     &           &amp;
 *     "           &quot;
 *     '           &#039;
 *
    Note that JSTL's {@code } escapes the exact same set of * characters as this method. That is, {@code } * is good for escaping to produce valid XML, but not for producing safe * HTML. */ public static String forXML(String aText) { if (aText == null) return null; final StringBuilder result = new StringBuilder(); final StringCharacterIterator iterator = new StringCharacterIterator(aText); char character = iterator.current(); while (character != CharacterIterator.DONE) { if (character == '<') { result.append("<"); } else if (character == '>') { result.append(">"); } else if (character == '\"') { result.append("""); } else if (character == '\'') { result.append("'"); } else if (character == '&') { result.append("&"); } else { //the char is not a special one //add it to the result as is result.append(character); } character = iterator.next(); } return result.toString(); } public TaggingDictionaryExtractor(File corpus, File wd, File posd, String tokenisationType) { this(corpus, wd, posd, tokenisationType, 10); } public TaggingDictionaryExtractor(File corpus, File wd, File posd, String tokenisationType, int catFreq) { try { wbr = new BufferedWriter(new FileWriter(wd)); pbr = new BufferedWriter(new FileWriter(posd)); minCatFreq = catFreq; if (tokenisationType.equalsIgnoreCase("srilm")) { incorp = new SRILMFactoredBundleCorpusIterator(new BufferedReader(new FileReader(corpus))); } else { incorp = new PipeDelimitedFactoredBundleCorpusIterator(new BufferedReader(new FileReader(corpus))); } } catch (IOException ex) { Logger.getLogger(TaggingDictionaryExtractor.class.getName()).log(Level.SEVERE, null, ex); } } /** * Extract the dictionaries. */ @SuppressWarnings("unchecked") public void extract() { try { List currsent = null; String currForm = null, currPOS = null; //Set currFormSTs = null, curPOSSTs = null; //Integer currWdCnt = null; Pair> currFormFetch = null; Set currFormSet = null, currPOSSet = null; Map catCount = new HashMap(); while (incorp.hasNext()) { // for every word in every sentence, update the counts, and add to the word- and POS-based // allowable tags. currsent = incorp.next(); for (Word w : currsent) { currForm = w.getForm(); currPOS = w.getPOS(); Object wfetch = wdmap.get(currForm); String stag = w.getSupertag(); catCount.put(stag, catCount.get(stag)==null ? 1 : catCount.get(stag) + 1); if (wfetch == null) { currFormSet = new HashSet(); currFormSet.add(w.getSupertag()); wdmap.put(currForm, new Pair>(new Integer(1), currFormSet)); } else { currFormFetch = ((Pair>) wfetch); currFormSet = currFormFetch.b; currFormSet.add(w.getSupertag()); wdmap.put(currForm, new Pair>(new Integer(currFormFetch.a.intValue() + 1), currFormSet)); } Object pfetch = posmap.get(currPOS); if (pfetch == null) { currPOSSet = new HashSet(); currPOSSet.add(w.getSupertag()); } else { currPOSSet = (Set) pfetch; currPOSSet.add(w.getSupertag()); } posmap.put(currPOS, currPOSSet); } } // now write out the dictionaries. 
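            // Each word entry lists the supertags observed with that word, keeping only
            // categories whose corpus-wide count reaches minCatFreq; the POS-based
            // dictionary below is written the same way.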
String wrd = null; Pair> lkup = null; wbr.write("\n"); wbr.write("\n"); for (Object wdobj : wdmap.keySet()) { wrd = (String) wdobj; lkup = (Pair>) (wdmap.get(wdobj)); wbr.write("\t\n"); for (String st : lkup.b) { if(catCount.get(st) >= minCatFreq) { wbr.write("\t\t " + forXML(st) + " \n"); } } wbr.write("\t\n"); } wbr.write(""); String pos = null; Set plkup = null; pbr.write("\n"); pbr.write("\n"); for (Object pobj : posmap.keySet()) { pos = (String) pobj; plkup = (Set) posmap.get(pobj); pbr.write("\t\n"); for (String st : plkup) { if(catCount.get(st) >= minCatFreq) { pbr.write("\t\t " + forXML(st) + " \n"); } } pbr.write("\t\n"); } pbr.write(""); // clean up. wbr.flush(); wbr.close(); pbr.flush(); pbr.close(); // done } catch (FileNotFoundException ex) { Logger.getLogger(TaggingDictionaryExtractor.class.getName()).log(Level.SEVERE, null, ex); } catch (IOException e) { Logger.getLogger(TaggingDictionaryExtractor.class.getName()).log(Level.SEVERE, null, e); } } public static void main(String[] args) throws Exception { String usage ="\nTaggingDictionaryExtractor -i -f -p -w \n\n"; if(args.length > 0 && args[0].equals("-h")) { System.out.print(usage); System.exit(0); } String inputCorp = null, wOutput = null, pOutput = null; // how frequently must a supertag category have been seen to be included in the dictionary? int catFreq = 10; for(int i = 0; i < args.length; i++) { if(args[i].equals("-i")) {inputCorp = args[++i]; continue;} if(args[i].equals("-w")) {wOutput = args[++i]; continue;} if(args[i].equals("-p")) {pOutput = args[++i]; continue;} if(args[i].equals("-f")) {catFreq = Integer.parseInt(args[++i]); continue; } System.err.println("Unknown command-line option: "+args[i]); } File in = new File(inputCorp); File wout = new File(wOutput); File pout = new File(pOutput); TaggingDictionaryExtractor tde = new TaggingDictionaryExtractor(in, wout, pout, "SRILM", catFreq); tde.extract(); } } ================================================ FILE: src/opennlp/ccg/parse/tagger/Constants.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (c) 2010 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed inp the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.tagger; import opennlp.ccg.lexicon.Word; /** * @author Dennis N. 
Mehay */ public final class Constants { public static final Double one = new Double(1.0); public static final Double zero = new Double(0.0); public static final TaggedWord OOB = new TaggedWord(Word.createWord("OOS", null, null, "OOS", "OOS", "OOS", null)); public static enum Domain {PROB, LOGPROB}; public static enum TaggingAlgorithm {FORWARDBACKWARD, FORWARD}; } ================================================ FILE: src/opennlp/ccg/parse/tagger/ProbIndexPair.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.tagger; /** * @author Dennis N. Mehay * @version $Revision: 1.1 $, $Date: 2010/09/21 04:12:41 $ */ public class ProbIndexPair implements Comparable { public Double a; public Integer b; public ProbIndexPair(Double a, Integer b) { this.a=a; this.b=b; } public int compareTo(ProbIndexPair p) { return (-1 * (this.a).compareTo(p.a)); } public static void main(String[] args) { ProbIndexPair p1 = new ProbIndexPair(new Double(4.0), new Integer(5)); ProbIndexPair p2 = new ProbIndexPair(new Double(3.0), new Integer(5)); ProbIndexPair p3 = new ProbIndexPair(new Double(2.0), new Integer(5)); ProbIndexPair p4 = new ProbIndexPair(new Double(4.0), new Integer(5)); System.out.println("p1 < p2? "+(p1.compareTo(p2)<0)); System.out.println("p2 < p3? "+(p2.compareTo(p3)<0)); System.out.println("p1 < p3? "+(p1.compareTo(p3)<0)); System.out.println("p1 == p4? "+(p1.compareTo(p4)==0)); System.out.println("p2 > p1? "+(p2.compareTo(p1)>0)); System.out.println("p3 > p2? "+(p3.compareTo(p2)>0)); System.out.println("p3 > p1? "+(p3.compareTo(p1)>0)); } } ================================================ FILE: src/opennlp/ccg/parse/tagger/TaggedWord.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (c) 2010 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed inp the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// /** * A wrapper around {@code Word}s that can hold multitaggings (for POSs and for * supertags). */ package opennlp.ccg.parse.tagger; import java.util.List; import opennlp.ccg.lexicon.Word; import opennlp.ccg.util.Pair; /** * @author Dennis N. Mehay */ public class TaggedWord { // multitaggings for POSs and supertags (resp). private List> postagging; private List> stagging; // old-timey Word that holds the word form (and potentially gold POS and supertag). private Word oldWord; /** Decorators for the core functionality of the underlying word. */ public String getSupertag() { return oldWord.getSupertag(); } public String getForm() { return oldWord.getForm(); } public String getPOS() { return oldWord.getPOS(); } /** Accessor for the underlying vanilla Word. */ public Word getWord() { return oldWord; } /** Constructor with a Word. */ public TaggedWord(Word wd) { oldWord = Word.createFullWord(wd, wd.getForm(), wd.getPOS(), wd.getSupertag(), wd.getSemClass()); } /** This does the obvious thing. */ public void setSupertagging(List> stagging) { this.stagging = stagging; } /** * Set the multi-POS tagging. * Also replace the underlying single-best tagging with the * first tag of the multitag list. */ public void setPOSTagging(List> postagging) { this.postagging = postagging; oldWord = Word.createFullWord(oldWord, oldWord.getForm(), this.postagging.get(0).b, oldWord.getSupertag(), oldWord.getSemClass()); } /** This does the obvious thing. */ public List> getSupertagging() { return stagging; } /** This does the obvious thing. */ public List> getPOSTagging() { return postagging; } /** Gets the gold-standard supertag. */ public String getGoldSuper() { return oldWord.getSupertag(); } /** Gets the gold-standard POS tag. */ public String getGoldPOS() { return oldWord.getPOS(); } } ================================================ FILE: src/opennlp/ccg/parse/tagger/io/CorpusIterator.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.tagger.io; import java.io.IOException; import java.util.Iterator; import java.util.List; import opennlp.ccg.lexicon.Word; /** * An interface that all file iterators must (should?) implement. * * @author Dennis N. 
Mehay * @version $Revision: 1.1 $, $Date: 2010/09/21 04:12:41 $ */ public interface CorpusIterator { public List next() throws IOException; public boolean hasNext(); public void close(); public Iterator> iterator(); } ================================================ FILE: src/opennlp/ccg/parse/tagger/io/PipeDelimitedFactoredBundleCorpusIterator.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.tagger.io; import java.io.BufferedReader; import java.io.IOException; import java.util.Iterator; import java.util.List; import opennlp.ccg.lexicon.Tokenizer; import opennlp.ccg.lexicon.Word; import opennlp.ccg.parse.supertagger.util.PipedTokenizer; /** * Assuming an input file of n different sentences of the form: * wordbundle1 wordbundle2 ... wordbundleM * ... [n-2 lines] * wordbundle1 ... wordbundleQ * * where the 'wordbundle's are SRILM factored LM-compliant * bundles of factors (wordform, lemma, POS, supertag, semantic class, etc.). * * We assume one sentence per line, so the ... bracketing is just * a formality (what SRILM expects). * * @author Dennis N. Mehay * @version $Revision: 1.2 $, $Date: 2010/09/26 05:50:15 $ */ public class PipeDelimitedFactoredBundleCorpusIterator implements CorpusIterator, Iterator>, Iterable> { private BufferedReader reader; private String nextLine, nextID; public static final String SENT_START = "", SENT_END = ""; private Tokenizer toker = new PipedTokenizer(); /** Creates a new instance of SRILMFactoredBundleCorpusIterator */ public PipeDelimitedFactoredBundleCorpusIterator(BufferedReader file) { try { this.reader = file; String line = this.reader.readLine(); //while (line.length() == 0 && line != null) { // line = this.reader.readLine(); //} if (line != null && line.length() > 0) { line = line.trim(); this.nextLine = line; } else { this.nextLine = this.nextID = null; } } catch (Exception e) { e.printStackTrace(); } } /** * The client of this method is responsible for checking that there * is in fact a next line (by calling hasNext before * calling this method. * * @return A String representing the next line in the * file. * @throws java.io.IOException. 
*/ public List next() { List currentSent = null; try { if (this.hasNext()) { String line = this.reader.readLine(); //while(line != null && (line.length()==0 || line.trim().equals(""))) { // line = this.reader.readLine(); //} if (line != null) { line = line.trim(); } if (this.nextLine.endsWith(SENT_END)) { currentSent = toker.tokenize(this.nextLine.substring(this.nextLine.indexOf(">") + 1, this.nextLine.lastIndexOf("<")).trim()); } else { currentSent = toker.tokenize(this.nextLine.substring(this.nextLine.indexOf(">") + 1).trim()); } if (line != null && !(line.trim().equals(""))) { this.nextLine = line; } else { this.nextLine = this.nextID = null; } } else { throw new IOException("There is no next line."); } } catch (IOException ex) { java.util.logging.Logger.getLogger("global").log(java.util.logging.Level.SEVERE, ex.getMessage(), ex); } return currentSent; } /** * @return A String representing the current parse ID * (a la CCGbank). */ public String getCurrentID() { return this.nextID; } /** * @return A boolean as to whether there is a next line * in the file. */ public boolean hasNext() { return this.nextLine != null; } /** * Closes the underlying BufferedReader. * */ public void close() { try { this.reader.close(); } catch (IOException ex) { java.util.logging.Logger.getLogger("global").log(java.util.logging.Level.SEVERE, ex.getMessage(), ex); } } public void remove() { throw new UnsupportedOperationException("Not supported yet."); } public Iterator> iterator() { return this; } } ================================================ FILE: src/opennlp/ccg/parse/tagger/io/SRILMFactoredBundleCorpusIterator.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.tagger.io; import java.io.BufferedReader; import java.io.IOException; import java.util.Iterator; import java.util.List; import opennlp.ccg.lexicon.DefaultTokenizer; import opennlp.ccg.lexicon.Tokenizer; import opennlp.ccg.lexicon.Word; /** * Assuming an input file of n different sentences of the form: * wordbundle1 wordbundle2 ... wordbundleM * ... [n-2 lines] * wordbundle1 ... wordbundleQ * * where the 'wordbundle's are SRILM factored LM-compliant * bundles of factors (wordform, lemma, POS, supertag, semantic class, etc.). * * We assume one sentence per line, so the ... bracketing is just * a formality (what SRILM expects). * * @author Dennis N. 
Mehay * @version $Revision: 1.2 $, $Date: 2010/09/26 05:50:15 $ */ public class SRILMFactoredBundleCorpusIterator implements CorpusIterator, Iterator>, Iterable> { private BufferedReader reader; private String nextLine, nextID; public static final String SENT_START = "", SENT_END = ""; private Tokenizer toker = new DefaultTokenizer(); /** Creates a new instance of SRILMFactoredBundleCorpusIterator */ public SRILMFactoredBundleCorpusIterator(BufferedReader file) { try { this.reader = file; String line = this.reader.readLine(); if (line != null && line.length() > 0) { line = line.trim(); this.nextLine = line; } else { this.nextLine = this.nextID = null; } } catch (Exception e) { e.printStackTrace(); } } /** * The client of this method is responsible for checking that there * is in fact a next line (by calling hasNext before * calling this method. * * @return A String representing the next line in the * file. * @throws java.io.IOException. */ public List next() { List currentSent = null; try { if (this.hasNext()) { String line = this.reader.readLine(); //while(line != null && (line.length()==0 || line.trim().equals(""))) { // line = this.reader.readLine(); //} if (line != null) { line = line.trim(); } if (this.nextLine.endsWith(SENT_END)) { currentSent = toker.tokenize(this.nextLine.substring(this.nextLine.indexOf(">") + 1, this.nextLine.lastIndexOf("<")).trim()); } else { currentSent = toker.tokenize(this.nextLine.substring(this.nextLine.indexOf(">") + 1).trim()); } if (line != null && !(line.trim().equals(""))) { this.nextLine = line; } else { this.nextLine = this.nextID = null; } } else { throw new IOException("There is no next line."); } } catch (IOException ex) { java.util.logging.Logger.getLogger("global").log(java.util.logging.Level.SEVERE, ex.getMessage(), ex); } return currentSent; } /** * @return A String representing the current parse ID * (a la CCGbank). */ public String getCurrentID() { return this.nextID; } /** * @return A boolean as to whether there is a next line * in the file. */ public boolean hasNext() { return this.nextLine != null; } /** * Closes the underlying BufferedReader. * */ public void close() { try { this.reader.close(); } catch (IOException ex) { java.util.logging.Logger.getLogger("global").log(java.util.logging.Level.SEVERE, ex.getMessage(), ex); } } public void remove() { throw new UnsupportedOperationException("Not supported yet."); } public Iterator> iterator() { return this; } } ================================================ FILE: src/opennlp/ccg/parse/tagger/ml/MaxentModel.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.tagger.ml; import java.util.Collection; import opennlp.ccg.util.Pair; /** * @author Dennis N. Mehay * @version $Revision: 1.1 $, $Date: 2010/09/21 04:12:41 $ */ public interface MaxentModel { public double[] eval(Collection> context); public String getOutcome(int indexOfOutcome); } ================================================ FILE: src/opennlp/ccg/parse/tagger/ml/TaggerFeature.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (c) 2010 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed inp the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.tagger.ml; /** * @author Dennis N. Mehay */ public class TaggerFeature { public String name; public Double activation; public TaggerFeature(String name, Double activation) { this.name = name.intern(); this.activation = activation; } } ================================================ FILE: src/opennlp/ccg/parse/tagger/ml/ZLMEM.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.tagger.ml; import java.io.File; import java.util.Collection; import opennlp.ccg.util.Pair; import opennlp.ccg.parse.tagger.Constants; /** * Decorates ZLMaxentModel, making it a MaxentModel. * * @author Dennis N. Mehay * @version $Revision: 1.2 $, $Date: 2010/09/26 05:50:15 $ */ public class ZLMEM extends ZLMaxentModel implements MaxentModel { public ZLMEM(File model) { super(model); } /** * @param context: A collection of String,Double pairs, representing the contextual input * features and their activations. 
* @return a double[] which represents a probability distribution over output classes, each * retrievable by its index with getOutcome(index); */ public double[] eval(Collection> context) { // Have to turn a collection of pairs into a String[] of feature:activation Strings. // Sloppy and inefficient. // TODO: A better solution would be to refactor ZLMaxentModel (DNM) String[] inpt = new String[context.size()]; int index = -1; for(Pair inp : context) { inpt[++index] = inp.a + ":" + inp.b; } return super.eval(context, true, Constants.Domain.PROB); } } ================================================ FILE: src/opennlp/ccg/parse/tagger/ml/ZLMaxentModel.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (c) 2010 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed inp the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.tagger.ml; /* A nearly literal translation of Zhang Le's pymaxent.py file * into Java (D.N. Mehay). */ import opennlp.ccg.parse.tagger.Constants.Domain; import opennlp.ccg.parse.tagger.Constants; import java.io.BufferedReader; import java.io.File; import java.io.FileNotFoundException; import java.io.FileReader; import java.io.IOException; import java.util.ArrayList; import java.util.Collection; import java.util.HashMap; import java.util.Map; import opennlp.ccg.util.Pair; public class ZLMaxentModel { public boolean verbose = false; private ItemMap predMap = null; private ItemMap outComeMap = null; ArrayList>> paramsMap; private boolean loaded = false; private double[] probs; private int n_outcome; // the parameters. private double[] theta; private Double one = Constants.one; public ZLMaxentModel() { } public ZLMaxentModel(File model) { load(model); } public void load(File modelFile) { if (!loaded) { loaded = true; BufferedReader br = null; try { br = new BufferedReader(new FileReader(modelFile)); String line = br.readLine(); if (line.contains("#")) { line = br.readLine(); } if (verbose) System.err.println("\nReading predicates..."); // Read in contextual predicates. int numPreds = Integer.parseInt(line); predMap = new ItemMap(); // read in predicates... for (int i = 0; i < numPreds; i++) { line = br.readLine(); predMap.add(line); } if (verbose) System.err.println("Reading outcomes..."); outComeMap = new ItemMap(); // Read in outcomes (labels). line = br.readLine(); int numOutcomes = Integer.parseInt(line); for (int j = 0; j < numOutcomes; j++) { line = br.readLine(); outComeMap.add(line); } if (verbose) System.err.println("Reading parameters..."); // Read parameters. 
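                    // Format of this section (one line per contextual predicate): the first token
                    // is the number of (outcome, parameter) associations for the predicate, and the
                    // remaining tokens are the outcome ids. Parameter ids are assigned sequentially
                    // in reading order and index into the theta array loaded next.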
int numParameters = predMap.size(); paramsMap = new ArrayList>>(numParameters); ArrayList> prms; int fid = 0; String ln = ""; for (int q = 0; q < numParameters; q++) { ln = br.readLine(); String[] lineParts = ln.split(" "); prms = new ArrayList>(Integer.parseInt(lineParts[0])); Integer oid; for (int p = 1; p < lineParts.length; p++) { oid = Integer.valueOf(lineParts[p]); prms.add(new Pair(oid, Integer.valueOf(fid))); fid++; } paramsMap.add(prms); } // Load theta. int nTheta = Integer.valueOf(br.readLine()); if (verbose) System.err.println("Number of parameters: " + nTheta); theta = new double[nTheta]; for (int z = 0; z < theta.length; z++) { theta[z] = Double.parseDouble(br.readLine()); } n_outcome = outComeMap.size(); // Initialise the array for computing distribution over all labels. probs = new double[n_outcome]; if (verbose) System.err.println("Number of outcomes: " + n_outcome); } catch (FileNotFoundException e) { e.printStackTrace(); } catch (IOException e) { e.printStackTrace(); } finally { try { br.close(); } catch (IOException ioe) { ioe.printStackTrace(); } } } } public String getBestOutcome(double[] probs) { double maxprob = 0.0; int maxidx = -1; for (int i = 0; i < probs.length; i++) { if (probs[i] > maxprob) { maxidx = i; maxprob = probs[i]; } } return getOutcome(maxidx); } public double[] eval(Collection> context, boolean realValued) { return eval(context, realValued, Domain.PROB); } public double[] eval(Collection> context, boolean realValued, Domain domain) { // Zero out prob distribution over labels. for (int i = 0; i < probs.length; i++) { probs[i] = 0.0; // build up exponentiated scores. } for (Pair pv : context) { Integer predID = predMap.id(pv.a); if (predID != null) { ArrayList> featClassAssocs = paramsMap.get(predID.intValue()); for (Pair classAndAssoc : featClassAssocs) { if (pv.b == one) { // ln(exp(lambda * 1)) = ln(exp(lambda)^1) = ln(exp(lambda)) = lambda probs[classAndAssoc.a.intValue()] += theta[classAndAssoc.b.intValue()]; } else { // ln(exp(lambda * )) = ln(exp(lambda)^) probs[classAndAssoc.a.intValue()] += Math.log(Math.exp(theta[classAndAssoc.b.intValue()] * pv.b.doubleValue())); } } } } double sum = 0.0; // exponentiate the numerators for the denomenator sum. for (int p = 0; p < probs.length; p++) { sum += Math.exp(probs[p]); } sum = Math.log(sum); for (int q = 0; q < probs.length; q++) { probs[q] -= sum; } if (domain == Domain.PROB) { // translate back from the log domain. 
for (int q = 0; q < probs.length; q++) { probs[q] = Math.exp(probs[q]); } } return probs; } public String getOutcome(int index) { return outComeMap.getItem(index); } } class ItemMap { private Integer index; private Map dict = new HashMap(); private Map reverseDict = new HashMap(); public ItemMap() { index = Integer.valueOf(0); } public int add(String item) { if (dict.containsKey(item)) { return dict.get(item); } else { dict.put(item, index); reverseDict.put(index, item); index = Integer.valueOf(index.intValue() + 1); return index.intValue() - 1; } } public Integer id(String item) { if (dict.containsKey(item)) { return dict.get(item); } else { return null; } } public int size() { return dict.size(); } public String getItem(int i) { return reverseDict.get(Integer.valueOf(i)); } } class IntegerPool { private Integer[] _table; public IntegerPool(int size) { _table = new Integer[size]; for (int i = 0; i < size; i++) { _table[i] = new Integer(i); } } public Integer getInt(int i) { if (i < _table.length && i >= 0) { return _table[i]; } else { return new Integer(i); } } } ================================================ FILE: src/opennlp/ccg/parse/tagger/sequencescoring/Backpointer.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (c) 2010 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed inp the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.tagger.sequencescoring; import java.util.List; /** * An abstraction for lists of backpointers in trellises, lattices, etc. * Each backpointer is a List of Integer's that give backpointers to the j-th highest * scoring paths (where 1 <= j <= N==len(Backpointer) are the indices of the * internal list of the backpointer). * * @author Dennis N. Mehay */ public class Backpointer { private List bkpts; public Backpointer(List bkpts) { this.bkpts = bkpts; } public List getBkpts() { return bkpts; } public Integer get(int i) { return bkpts.get(i); } public int size() { return bkpts.size(); } } ================================================ FILE: src/opennlp/ccg/parse/tagger/sequencescoring/FBNode.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (c) 2010 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed inp the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. 
See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.tagger.sequencescoring; import java.util.List; /** * A node in a forward-backward lattice. * * Holds the current label, the forward score, backward score, a list of Doubles representing * this node's contribution to the scores of the following nodes in the next * step of the lattice, a list of Strings representing the Markov history of the * optimal sequence leading up to this node, and, finally, holds a ranked array of * backpointers to the n-best optimal predecessor nodes. * * @author Dennis N. Mehay */ public class FBNode { /** How far back of a Markov history window do we have? */ public int markovHistSize; /** The label at this node. */ public String label; /** The (normalised) sum of the log-probabilites of all paths leading to this node. */ public double forwardScore = 0.0; /** The (normalised) sum of the log-probabilites of all paths starting at this node. */ public double backwardScore = 0.0; /** * How does this node contribute to each of the nodes in the next time step in * the lattice? */ public List forwardContributions; /** The list of the optimal Markov history. */ public List markovHist; /** * A list of backpointers to the nodes in the previous time step (ranked in order * of how likely the sequence including them leading to this node is). */ public List backpointers; /** * Empty constructor. Default Markov history of length 2. * All other values are set directly in the fields as they are calculated. */ public FBNode() { this(2); } /** Constructor that only specifies Markov history size. */ public FBNode(int markovHistSize) { this.markovHistSize = markovHistSize; } } ================================================ FILE: src/opennlp/ccg/parse/tagger/sequencescoring/SequenceScorer.java ================================================ /////////////////////////////////////////////////////////////////////////////// // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.tagger.sequencescoring; import java.io.BufferedReader; import java.io.File; import java.io.FileNotFoundException; import java.io.FileReader; import java.io.IOException; import java.util.ArrayList; import java.util.Arrays; import java.util.List; import java.util.logging.Level; import java.util.logging.Logger; import opennlp.ccg.lexicon.Word; import opennlp.ccg.ngrams.StandardNgramModel; import opennlp.ccg.util.Interner; import opennlp.ccg.util.Pair; import opennlp.ccg.parse.tagger.ProbIndexPair; import opennlp.ccg.parse.tagger.Constants; /** * Initialise with a language model over the output sequences and, * given a List of List>'s initially tagged with "observation" * probabilities (output probabilities only based on local features), * return the forward-pass re-estimated probabilites of the output * classes. * * @author Dennis N. Mehay */ public class SequenceScorer extends StandardNgramModel { /** * A Trellis to hold sequence labels (wrapped in Word classes) * functionality. */ private Trellis seqLabs; /** Trellis for initial observation model scores. */ private Trellis initScores; /** Trellis for forward-backward re-estimated scores. */ private Trellis fbScores; /** Trellis of back-pointers (for retrieving n-best sequences). */ private Trellis backPointers; /** How many of the previous (following) best predictions make it into the forward (or backward) search? */ private int searchBeam = 200; /** Re-usable private data structures. */ private List> tmpInitScores = new ArrayList>(500); private List> tmpFwdScores = new ArrayList>(500); private List> tmpSeqLabs = new ArrayList>(500); private List> tmpBkpointers = new ArrayList>(500); /** For interning Word's */ private Interner words = new Interner(); private Constants.TaggingAlgorithm alg = Constants.TaggingAlgorithm.FORWARDBACKWARD; /** Create a ForwardScorer with a sequence model (over supertags, POSs tags, words, etc.) */ public SequenceScorer(int order, String lmFile) throws IOException { super(order, lmFile); } /** * A utility method for finding the order of n-gram models (by reading in the ARPA-formatted file. * (A bit messy, I know.) */ public static int findOrder(String tagSequenceModel) { // find n-gram order of sequence model. BufferedReader reader = null; String ln = null; int ord = 0; try { reader = new BufferedReader(new FileReader(new File(tagSequenceModel))); ln = reader.readLine(); reader = new BufferedReader(new FileReader(new File(tagSequenceModel))); while (ln != null && !ln.startsWith("\\data\\")) { ln = reader.readLine(); } ln = reader.readLine(); while (ln != null & ln.startsWith("ngram ")) { ord = Integer.parseInt(ln.split(" ")[1].split("=")[0]); ln = reader.readLine(); } reader.close(); } catch (FileNotFoundException fnfe) { Logger.getLogger(SequenceScorer.class.getName()).log(Level.SEVERE, null, fnfe); } catch (IOException ioe) { Logger.getLogger(SequenceScorer.class.getName()).log(Level.SEVERE, null, ioe); } return ord; } /** Set the tagging algorithm (with one of {forward-backward, forward}). */ public void setAlgorithm(Constants.TaggingAlgorithm newAlg) { alg = newAlg; } /** * Set the maximum width of the number of previous hypothesized tags to consider * in the forward probabilities. */ public void setSearchBeam(int newBeam) { searchBeam = newBeam; } /** Rescore an observation sequence of (initially) supertagged Word's using the sequence model. 
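     * Each inner list holds one word's candidate tags paired with their observation
     * (log-)probabilities; the same structure is returned with the probabilities
     * re-estimated by the forward(-backward) pass and re-sorted, best tag first.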
*/ public List>> rescoreSequence(List>> observationSequence) { // build up initial trellises. tmpInitScores.clear(); tmpFwdScores.clear(); tmpSeqLabs.clear(); tmpBkpointers.clear(); for (List> tw : observationSequence) { ArrayList scrs = new ArrayList(tw.size()); ArrayList fscs = new ArrayList(tw.size()); ArrayList sLabs = new ArrayList(tw.size()); ArrayList bpts = new ArrayList(tw.size()); for (Pair tagging : tw) { // add observation score, and convert to log-prob domain, if needed. scrs.add((tagging.a > 0) ? Math.log(tagging.a) : tagging.a); fscs.add(null); sLabs.add(words.intern(Word.createWord(tagging.b, null, null, null, null, null, null))); bpts.add(null); } tmpInitScores.add(scrs); tmpSeqLabs.add(sLabs); tmpFwdScores.add(fscs); tmpBkpointers.add(bpts); } initScores = new Trellis(tmpInitScores); // these are initially null. fbScores = new Trellis(tmpFwdScores); // these are too. backPointers = new Trellis(tmpBkpointers); seqLabs = new Trellis(tmpSeqLabs); // forward loop. // for each word... for (int u = 0; u < observationSequence.size(); u++) { List> tw = observationSequence.get(u); double normTot = 0.0; // for each of its tags within the search beam. for (int v = 0; v < tw.size(); v++) { Word currTag = seqLabs.getCoord(u, v); List bestHist = null; Double seqScore = null; Double obsScore = initScores.getCoord(u, v); if (u == 0) { // beginning of sequence. bestHist = getBestHist(u, v, order); bestHist.add(currTag); seqScore = lmScore(bestHist); double fs = seqScore + obsScore; normTot += Math.exp(fs); fbScores.setCoord(u, v, fs); } else { // use dynamic programming-computed scores to progress. List> prevTaggedWord = observationSequence.get(u - 1); ProbIndexPair[] bestPrevScores = new ProbIndexPair[Math.min(prevTaggedWord.size(), searchBeam)]; for (int z = 0; z < Math.min(prevTaggedWord.size(), searchBeam); z++) { bestHist = getBestHist(u - 1, z, order - 1); bestHist.add(currTag); seqScore = lmScore(bestHist); double fs = fbScores.getCoord(u - 1, z) + seqScore; fs += obsScore; bestPrevScores[z] = new ProbIndexPair( Double.valueOf(fs), Integer.valueOf(z)); } // sort descending based on score. Arrays.sort(bestPrevScores); // add up the prob's of all sequences leading to this node. double fsum = 0.0; for (int q = 0; q < bestPrevScores.length; q++) { fsum += Math.exp(bestPrevScores[q].a); } normTot += fsum; //fbScores.setCoord(u, v, bestPrevScores[0].a.doubleValue()); fbScores.setCoord(u, v, Math.log(fsum)); // add n-best backpointers. List bks = new ArrayList(bestPrevScores.length); for (int q = 0; q < bestPrevScores.length; q++) { bks.add(bestPrevScores[q].b); } backPointers.setCoord(u, v, new Backpointer(bks)); } } // normalise. for (int v = 0; v < tw.size(); v++) { fbScores.setCoord(u, v, Math.log(Math.exp(fbScores.getCoord(u, v)) / normTot)); } } // backward loop. int size = observationSequence.size(); if (alg == Constants.TaggingAlgorithm.FORWARDBACKWARD) { // for each word... for (int u = size - 1; u >= 0; u--) { List> tw = observationSequence.get(u); double normTot = 0.0; // for each of its tags... for (int v = 0; v < tw.size(); v++) { List bestHist = null; Double obsScore = initScores.getCoord(u, v); if (u == (size - 1)) { // right-hand end of sequence. bestHist = getBestHist(u, v, order - 1); bestHist.add(words.intern(Word.createWord("", null, null, null, null, null, null))); double bsc = fbScores.getCoord(u, v) + obsScore; normTot += Math.exp(bsc); fbScores.setCoord(u, v, bsc); } else { // use dynamic programming-computed scores to progress backwards. 
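                        // Backward update in the log domain: the new score for tag v of word u is
                        //   obsScore(u,v) + log( sum_z exp( lmScore(hist(u,v) . tag(u+1,z)) + score(u+1,z) ) ),
                        // summing over the candidate tags z of the following word, where score(u+1,z)
                        // holds the already-normalised forward score from the forward pass.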
bestHist = getBestHist(u, v, order - 1); List> followingTaggedWd = observationSequence.get(u + 1); double backwardSum = 0.0; for (int z = 0; z < followingTaggedWd.size(); z++) { Word followingTag = words.intern(Word.createWord(followingTaggedWd.get(z).b.intern(), null, null, null, null, null, null)); if (z > 0) { bestHist.remove(bestHist.size() - 1); } bestHist.add(followingTag); backwardSum += Math.exp(lmScore(bestHist) + fbScores.getCoord(u + 1, z)); } double newSc = Math.log(backwardSum) + obsScore; normTot += Math.exp(newSc); fbScores.setCoord(u, v, newSc); } } // normalise. for (int v = 0; v < tw.size(); v++) { fbScores.setCoord(u, v, Math.log(Math.exp(fbScores.getCoord(u, v)) / normTot)); } } } // re-sort based on re-estimated scores. for (int i = 0; i < observationSequence.size(); i++) { ProbIndexPair[] fwdScrs = new ProbIndexPair[observationSequence.get(i).size()]; List> tagging = observationSequence.get(i); for (int j = 0; j < tagging.size(); j++) { double probP = Math.exp(fbScores.getCoord(i, j).doubleValue()); fwdScrs[j] = new ProbIndexPair(probP, new Integer(j)); } Arrays.sort(fwdScrs); List> newTagging = new ArrayList>(fwdScrs.length); for (int z = 0; z < fwdScrs.length; z++) { Double renorm = new Double(fwdScrs[z].a.doubleValue()); if (renorm.equals(Constants.one)) { renorm = Constants.one; } newTagging.add(new Pair(renorm, tagging.get(fwdScrs[z].b.intValue()).b)); } observationSequence.set(i, newTagging); } return observationSequence; } /** * Use the LM to score a sequence of words. */ private double lmScore(List seq) { setWordsToScore(seq, false); prepareToScoreWords(); return logprob(); } /** Follow the back-pointers to get the best sequence of up to length 'order' leading up to cell (i,j). */ private List getBestHist(int i, int j, int order) { int size = Math.max(order, 0); List retVal = null; Backpointer bp = backPointers.getCoord(i, j); if (i == -1) { // base case (off of the end of the sequence). retVal = new ArrayList(size); retVal.add(words.intern(Word.createWord("", null, null, null, null, null, null))); return retVal; } else if (i == 0) { // base case (at beginning of sequence) retVal = getBestHist(i - 1, 0, order - 1); retVal.add(seqLabs.getCoord(i, j)); return retVal; } else if (order == 0) { // base case (reached back as far as the n-gram model will need to see). retVal = new ArrayList(size); return retVal; } else { // recursive case. retVal = getBestHist(i - 1, bp.get(0).intValue(), order - 1); retVal.add(seqLabs.getCoord(i, j)); return retVal; } } } ================================================ FILE: src/opennlp/ccg/parse/tagger/sequencescoring/Trellis.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (c) 2010 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed inp the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.tagger.sequencescoring; import java.util.ArrayList; import java.util.List; /** * A Trellis for sequence coding (of supertags, e.g.). * * @author Dennis N. Mehay */ public class Trellis { /** The dimensions of the Trellis. */ private int cols, rows; /** The actual nuts and bolts of the Trellis. */ private ArrayList> trellis; /** Constructor with passed-in list of lists. */ public Trellis(List> inpt) { this.reshape(inpt.size(), inpt.get(0).size(), inpt); } /** Constructor with dimensions. */ public Trellis(int cols, int rows, A dummy) { List> tr = new ArrayList>(cols); for(int i = 0; i < cols; i++) { ArrayList tmp = new ArrayList(rows); for(int j = 0; j < rows; j++) { tmp.add(dummy); } tr.add(tmp); } reshape(cols, rows, tr); } /** * Reshape the dimensions (e.g., to accomodate a new sequence with a * particular max beam width */ public void reshape(int cols, int rows, List> inpt) { this.cols = cols; this.rows = rows; this.trellis = new ArrayList>(cols); for(List la : inpt) { ArrayList row = new ArrayList(rows); for(A a : la) { row.add(a); } this.trellis.add(row); } } /** What is the max beam width? */ public int getWidth() { return rows; } /** What is the length of the sequence? */ public int getLength() { return cols; } /** Clear out values in the trellis. */ public void clear() { for(int i = 0; i < cols; i++) { this.trellis.add(new ArrayList(rows)); } } /** Get the sequence options at index i. */ public ArrayList getOptions(int i) { return this.trellis.get(i); } /** Get a node in the Trellis (referenced by 2D coordinate). */ public A getCoord(int i, int j) { try {return this.trellis.get(i).get(j); } catch(IndexOutOfBoundsException iobe) { return null; } } /** Set the value at a node in the Trellis (referenced by 2D coordinate) */ public void setCoord(int i, int j, A val) { this.trellis.get(i).set(j, val); } } ================================================ FILE: src/opennlp/ccg/parse/tagger/util/CCGBankToSRILMFLM.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (c) 2010 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed inp the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// /* * Read in the CCGbank (auto format), line by line, and transform each lexical * item () into an SRILM factored LM bundle format: * W-word:S-word:P-pos1:T:cat1, where every thing has been escaped (e.g., colons), * "W" stands for word form, "S" for stem, "P" for POS and "T" for super_t_ag. 
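 * For illustration (the word and category here are hypothetical; exact escaping is done by
 * DefaultTokenizer.escape below): a leaf for the word "buy" with POS "VB" and supertag
 * "(S[b]\NP)/NP" would come out roughly as
 *   W-buy:S-buy:P-VB:T-(S[b]\NP)/NP
 * noting that the code uses the word form for both the W and S factors.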
*/ package opennlp.ccg.parse.tagger.util; import java.io.BufferedReader; import java.io.BufferedWriter; import java.io.File; import java.io.FileNotFoundException; import java.io.FileReader; import java.io.FileWriter; import java.io.IOException; import java.util.regex.Matcher; import java.util.regex.Pattern; import opennlp.ccg.lexicon.DefaultTokenizer; /** * @author Dennis N. Mehay */ public class CCGBankToSRILMFLM { public static void main(String[] args) throws FileNotFoundException, IOException { String usage = "\nCCGBankToSRILMFLM -input -o \n"; if (args.length > 0 && args[0].equals("-h") || args.length == 0) { System.out.println(usage); System.exit(0); } BufferedReader reader = null; BufferedWriter writer = null; String inputCorp = "train.auto", output = "train.srilm"; for (int i = 0; i < args.length; i++) { if (args[i].equals("-i")) {inputCorp = args[++i]; continue;} if (args[i].equals("-o")) {output = args[++i]; continue;} System.out.println("Unrecognized option: " + args[i]); } reader = new BufferedReader(new FileReader(new File(inputCorp))); writer = new BufferedWriter(new FileWriter(new File(output))); String parseIDHeader = "ID="; Pattern p = Pattern.compile("()+?"); String line = reader.readLine(); while(line != null) { if(line.startsWith(parseIDHeader)) {line = reader.readLine(); continue;} line = line.trim(); Matcher m = p.matcher(line); String word = null, pos = null, cat = null; int cnt = 0; while(m.find()) { String toks = m.group(); // {} String[] parts = toks.split(" "); word = parts[4]; pos = parts[2]; cat = parts[1]; if(cnt++ > 0) { writer.write(" "); } writer.write("W-"+DefaultTokenizer.escape(word)+":" +"S-"+DefaultTokenizer.escape(word)+":" +"P-"+DefaultTokenizer.escape(pos)+":" +"T-"+DefaultTokenizer.escape(cat)); } writer.write(System.getProperty("line.separator")); line = reader.readLine(); } writer.close(); reader.close(); } } ================================================ FILE: src/opennlp/ccg/parse/tagger/util/ConfigFileProcessor.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (c) 2010 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed inp the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.tagger.util; import java.io.BufferedReader; import java.io.File; import java.io.FileNotFoundException; import java.io.FileReader; import java.io.IOException; import java.util.*; //import java.util.Map; import java.util.logging.Level; import java.util.logging.Logger; /** * @author Dennis N. Mehay */ public class ConfigFileProcessor { /** Read in config file as a {@code Map}. 
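 * For illustration (the keys and values are hypothetical), a config file is a sequence of
 * key=value lines; blank lines and lines starting with '#' are skipped and keys are lower-cased:
 *   # tagger settings
 *   beta=0.1
 *   maxtags=4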
*/ public static Map readInConfig(String configFile) { return readInConfig(configFile, null); } /** * Read in config file as a {@code Map}, resolving the given path keys * relative to the config file if not absolute. */ public static Map readInConfig(String configFile, String pathKeys[]) { Set paths = Collections.emptySet(); if (pathKeys != null) paths = new HashSet(Arrays.asList(pathKeys)); BufferedReader cf = null; Map opts = new HashMap(); try { File infile = new File(configFile); File parentDir = infile.getParentFile(); cf = new BufferedReader(new FileReader(infile)); String ln = cf.readLine(); // map options to values. while (ln != null) { if (ln.trim().equals("") || ln.trim().startsWith("#")) { ln = cf.readLine(); continue; } String[] parts = ln.trim().split("="); String key = parts[0].trim().toLowerCase(); String val = parts[1].trim(); // resolve path keys if (paths.contains(key)) { File f = new File(parentDir, val); if (!f.exists()) { f = new File(val); if (!f.exists()) throw new FileNotFoundException("Can't resolve filename: " + val); } val = f.getPath(); } opts.put(key, val); ln = cf.readLine(); } } catch (FileNotFoundException ex) { Logger.getLogger(ConfigFileProcessor.class.getName()).log(Level.SEVERE, null, ex); } catch (IOException ex) { Logger.getLogger(ConfigFileProcessor.class.getName()).log(Level.SEVERE, null, ex); } finally { try { cf.close(); } catch (IOException ex) { Logger.getLogger(ConfigFileProcessor.class.getName()).log(Level.SEVERE, null, ex); } } return opts; } } ================================================ FILE: src/opennlp/ccg/parse/tagger/util/ResultSink.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Dennis N. Mehay // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.parse.tagger.util; import java.util.HashMap; import java.util.Iterator; import java.util.List; import java.util.Map; import opennlp.ccg.lexicon.Word; import opennlp.ccg.util.Pair; /** * Inspired (loosely, based on my recollection) by Jason Baldridge's * similar class for tracking classifier performance. * Here we simply track the Word-by-Word * tagging performance of a CCG supertagger by passing in a multitagging * and a gold-standard answer and tabulating the results. The results * are reported by a custom report method, which returns * a String representation of the results. * * @author Dennis N. Mehay * @version $Revision: 1.1 $, $Date: 2010/09/21 04:12:42 $ */ public class ResultSink { public static enum ResultSinkType { SUPERTAG, POSTAG }; private int totalTags = 0, totalWords = 0, totalRight = 0; // for keeping pos-specific stats. 
private Map posToRight = new HashMap(), posTot = new HashMap(); // for tracking the total number of sentences, number totally tagged // correctly, etc. private int sentNum = 0, sentsCorrect = 0; private boolean allCorrect = true; // what type of tag are we tracking the results over? private ResultSinkType whatType; // for general pos-specific stats (e.g., N... -> , not NNP -> and NNPS -> , etc.) private Map genPOSToRight = new HashMap(), genPOSTot = new HashMap(); /** * Nullary constructor. Defaults to supertag result sink. * (TODO: add log file logging for more detailed error reporting.) */ public ResultSink() { this(ResultSinkType.SUPERTAG); } public ResultSink(ResultSinkType whatType) { this.whatType = whatType; } /** * Add and store a sentence of tagged words (List>>) * wrt a gold-standard tagged word. */ public void addSent(List>> sent, List goldTagging) { sentNum++; allCorrect = true; Iterator gold = goldTagging.iterator(); for (List> tgging : sent) { addResult(tgging, gold.next()); } if (allCorrect) { sentsCorrect++; } } /** * Add a single-word tagging result alongside its gold-standard tagging. * Compare and log whether the gold-standard tag is in the beta-best (also * log pos-specific error stats). */ public void addResult(List> tagging, Word goldTagging) { String goldTag = (whatType == ResultSinkType.SUPERTAG) ? goldTagging.getSupertag() : goldTagging.getPOS(); totalTags += tagging.size(); totalWords++; // mww: check for missing gold POS (grrr) if (goldTagging.getPOS() == null) { System.err.println("Warning: found null gold POS, skipping word: " + goldTagging); this.allCorrect = false; return; } String thisPOS = goldTagging.getPOS(), thisGenPOS = goldTagging.getPOS().substring(0, 1); Integer posT = this.posTot.get(thisPOS), gPOST = this.genPOSTot.get(thisGenPOS); if (posT == null) { this.posTot.put(thisPOS, new Integer(1)); } else { this.posTot.put(thisPOS, new Integer(posT.intValue() + 1)); } if (gPOST == null) { this.genPOSTot.put(thisGenPOS, new Integer(1)); } else { this.genPOSTot.put(thisGenPOS, new Integer(gPOST.intValue() + 1)); } // assume this tagging is incorrect, until proven otherwise. boolean gotIt = false; for (Pair tag : tagging) { if (tag.b.equals(goldTag)) { gotIt = true; totalRight++; // add one both to the pos right and total for that pos type. Integer posLkup = this.posToRight.get(thisPOS), genPOSLkup = this.genPOSToRight.get(thisGenPOS); if (posLkup == null) { this.posToRight.put(thisPOS, new Integer(1)); } else { this.posToRight.put(thisPOS, new Integer(posLkup.intValue() + 1)); } if (genPOSLkup == null) { this.genPOSToRight.put(thisGenPOS, new Integer(1)); } else { this.genPOSToRight.put(thisGenPOS, new Integer(genPOSLkup.intValue() + 1)); } break; } } // mistagged this one word, so tagging the whole sentence correctly -- // allCorrect==true -- is not possible. if (!gotIt) { this.allCorrect = false; } } public String report() { // make sure 0 counts are inserted for POS types that were never got right. 
for (String post : this.posTot.keySet()) { if (this.posToRight.get(post) == null) { this.posToRight.put(post, new Integer(0)); } } for (String post : this.genPOSTot.keySet()) { if (this.genPOSToRight.get(post) == null) { this.genPOSToRight.put(post, new Integer(0)); } } String rep = ""; rep += "\n\nAccuracy by POS type:\n\n"; for (String post : this.posTot.keySet()) { rep += post + ": " + ((this.posToRight.get(post).intValue() + 0.0) / (this.posTot.get(post))) + " <==> " + this.posToRight.get(post).intValue() + "/" + (this.posTot.get(post)) + " = " + (100 * ((this.posTot.get(post) - this.posToRight.get(post) + 0.0) / (totalWords - totalRight))) + " (% of total errors) \n"; } rep += "\nAccuracy by general (truncated) POS type:\n\n"; for (String post : this.genPOSTot.keySet()) { rep += post + ": " + (this.genPOSToRight.get(post).intValue() + 0.0) / (this.genPOSTot.get(post)) + " <==> " + this.genPOSToRight.get(post).intValue() + "/" + (this.genPOSTot.get(post)) + " = " + (100 * ((this.genPOSTot.get(post) - this.genPOSToRight.get(post) + 0.0) / (totalWords - totalRight))) + " (% of total errors) \n"; } rep += "\nTotal words: " + totalWords + "\nTotal sents: " + this.sentNum + "\nAggregate total tags: " + totalTags + "\nAve. tags/word: " + ((totalTags + 0.0) / (totalWords + 0.0)) + "\nWord accuracy: " + ((totalRight + 0.0) / totalWords) + "\n" + "\nSent accuracy: " + ((this.sentsCorrect + 0.0) / (this.sentNum)) + "\n\n"; return rep; } } ================================================ FILE: src/opennlp/ccg/perceptron/Alphabet.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2008 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.perceptron; import java.util.*; import java.io.*; import opennlp.ccg.util.*; import opennlp.ccg.lexicon.DefaultTokenizer; /** * A bidirectional mapping between feature names and indices. * * An alphabet can be read from either an alphabet file or a model file. * An alphabet file starts with the number of features on one line, * followed by one line per feature pairing the feature name with its * frequency (which is ignored). * * An alphabet can be open or closed. An closed alphabet does not * accept new features, and thus can be used to filter out features * not already in the alphabet. * * The main routine filters the input event file to an output alphabet file, * optionally with a table size and pruning threshold. * * @author Michael White * @version $Revision: 1.7 $, $Date: 2009/11/02 03:44:15 $ */ public class Alphabet { /** Feature as a node in a trie, with each node storing the feature index. */ public static class Feature extends TrieMap { /** Constructor with index. 
*/ public Feature(Integer index) { super(index); } /** Factory method, for adding empty child nodes. */ protected Feature createNode() { return new Feature(null); } /** Returns a string name by concatenating escaped keys using colons. */ public String name() { StringBuffer namebuf = new StringBuffer(); List keys = traceKeys(); for (int i=0; i < keys.size(); i++) { namebuf.append(DefaultTokenizer.escape(keys.get(i))); if (i+1 < keys.size()) namebuf.append(':'); } return namebuf.toString(); } /** Returns the index. */ public Integer getIndex() { return data; } } // mappings private Feature dict; private List dictInv; // size private int size = 0; // closed flag private boolean closed = false; /** Constructor with initial size. The alphabet is left open. */ public Alphabet(int size) { init(size); } /** Constructor to load an alphabet from a file. The alphabet is set to closed. */ public Alphabet(String filename) throws IOException { Reader reader = EventFile.openReader(new File(filename)); StreamTokenizer tokenizer = EventFile.initTokenizer(reader); tokenizer.nextToken(); int size = Integer.parseInt(tokenizer.sval); init(size); for (int i=0; i < size; i++) { tokenizer.nextToken(); add(tokenizer.sval); tokenizer.nextToken(); // skip freq or weight } reader.close(); closed = true; } // initializes dict, dictInv private void init(int size) { dict = new Feature(null); dictInv = new ArrayList(size); } /** Size. */ public int size() { return size; } /** Closed. */ public boolean closed() { return closed; } /** Set closed. */ public void setClosed(boolean closed) { this.closed = closed; } /** Add feature with given name, if not already present, returning added feature. */ public Feature add(String feat) { return add(parseKeys(feat)); } /** Add equivalent feature, if not already present, returning added feature. */ public Feature add(Feature f) { return add(f.traceKeys()); } /** Add feature with given keys, if not already present, returning added feature. */ public Feature add(List keys) { if (closed) throw new RuntimeException("Can't add to a closed alphabet!"); Feature node = (Feature) dict.findChildFromList(keys); return addNode(node); } /** Add feature with given keys, if not already present, returning added feature. */ public Feature addLazy(List> keyExtractors) { if (closed) throw new RuntimeException("Can't add to a closed alphabet!"); Feature node = (Feature) dict.findChildFromLazyList(keyExtractors); return addNode(node); } // adds a feature node private Feature addNode(Feature node) { if (node.data != null) return node; node.data = size++; dictInv.add(node); return node; } /** * Parses a feature name into a list of unescaped interned string keys, * breaking on colons. */ public static List parseKeys(String feat) { List retval = new ArrayList(); int current = 0; while (current < feat.length()) { int breakpos = feat.indexOf(":", current); String key; if (breakpos >= 0) { key = feat.substring(current, breakpos); current = breakpos + 1; } else { key = feat.substring(current); current = feat.length(); } retval.add(DefaultTokenizer.unescape(key).intern()); } return retval; } /** Get or add index of feature with given name (null if none when closed). */ public Feature index(String feat) { return index(parseKeys(feat)); } /** Get or add index of equivalent feature (null if none when closed). */ public Feature index(Feature f) { return index(f.traceKeys()); } /** Get or add index of feature with given keys (null if none when closed). 
*/ public Feature index(List keys) { if (!closed) return add(keys); Feature node = (Feature) dict.getChildFromList(keys); return node; } /** Get or add index of feature with given key extractors (null if none when closed). */ public Feature indexLazy(List> keyExtractors) { if (!closed) return addLazy(keyExtractors); Feature node = (Feature) dict.getChildFromLazyList(keyExtractors); return node; } /** Get indexed feature. */ public Feature feature(int index) { return dictInv.get(index); } /** * Creates an alphabet file from an event file, * saving it to a file with features sorted by frequency, * using the given table size and pruning threshold. **/ public static void createAlphabet(String eventfile, String alphabetfile, int tablesize, int pruningthreshold) throws IOException { // open files EventFile eventFile = new EventFile(eventfile); PrintWriter out = EventFile.openWriter(new File(alphabetfile)); // init freq tally Map freqTally = new HashMap(tablesize*2); // read event file, incrementing tallies EventFile.Block block; FeatureMap goldMap = new FeatureMap(); Set seenFeats = new HashSet(); while ( (block = eventFile.nextBlock()) != null ) { // set gold map (nb: assumes single gold event) goldMap.clear(); seenFeats.clear(); for (EventFile.Event event : block.events) { if (event.count > 0) goldMap.add(event.features); } // tally distinct feats not in gold map for (EventFile.Event event : block.events) { if (event.count > 0) continue; for (FeatureVector.Iterator it = event.features.iterator(); it.hasNext(); ) { Feature feat = it.nextFeature(); float val = it.nextValue(); seenFeats.add(feat); float goldVal = goldMap.get(feat); if (val != goldVal) { Integer tally = freqTally.get(feat); if (tally != null) freqTally.put(feat, ++tally); else freqTally.put(feat, 1); } } } // tally unseen feats from gold event for (EventFile.Event event : block.events) { if (event.count == 0) continue; for (FeatureVector.Iterator it = event.features.iterator(); it.hasNext(); ) { Feature feat = it.nextFeature(); if (!seenFeats.contains(feat)) { Integer tally = freqTally.get(feat); if (tally != null) freqTally.put(feat, ++tally); else freqTally.put(feat, 1); } } } } // get tallies passing frequency threshold List> tallies = new ArrayList>(freqTally.size()); if (pruningthreshold > 0) { for (Map.Entry entry : freqTally.entrySet()) { if (entry.getValue() >= pruningthreshold) tallies.add(entry); } } else tallies.addAll(freqTally.entrySet()); // sort tallies by descending frequency // (further sorting alphabetically seems to take too long) Collections.sort( tallies, new Comparator>() { public int compare(Map.Entry entry1, Map.Entry entry2) { int val1 = entry1.getValue(); int val2 = entry2.getValue(); if (val1 > val2) return -1; if (val1 < val2) return 1; return 0; //return entry1.getKey().name().compareTo(entry2.getKey().name()); } } ); // write tallied features to file int size = tallies.size(); out.println(Integer.toString(size)); for (int i=0; i < size; i++) { Map.Entry entry = tallies.get(i); out.println(entry.getKey().name() + " " + entry.getValue()); } // close files eventFile.close(); out.close(); } /** Main routine for filtering event file to an alphabet file. 
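 * For example (file names illustrative), an invocation along the lines of
 *   java opennlp.ccg.perceptron.Alphabet events.gz alphabet.gz -p 5
 * writes an alphabet keeping only features whose tallied frequency is at least 5.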
*/ public static void main(String[] args) throws IOException { if (args.length < 2) { System.out.println("Usage: java perceptron.Alphabet (-s ) (-p "); System.exit(0); } String eventfile = args[0]; String alphabetfile = args[1]; int tablesize = 1000000; int pruningthreshold = 0; for (int i=2; i < args.length; i++) { if (args[i].equals("-s")) tablesize = Integer.valueOf(args[++i]); if (args[i].equals("-p")) pruningthreshold = Integer.valueOf(args[++i]); } System.out.println("Writing alphabet to " + alphabetfile + " from event file " + eventfile); if (pruningthreshold > 0) System.out.println("with pruning threshold " + pruningthreshold); createAlphabet(eventfile, alphabetfile, tablesize, pruningthreshold); } } ================================================ FILE: src/opennlp/ccg/perceptron/ComposedFeatureExtractor.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.perceptron; import java.util.ArrayList; import opennlp.ccg.synsem.*; /** * Class for composing feature extractors. * Features from the component feature extractors are assumed to be independent. * * @author Michael White * @version $Revision: 1.5 $, $Date: 2011/01/15 17:52:59 $ */ public class ComposedFeatureExtractor implements FeatureExtractor { /** The feature extractors. */ public final FeatureExtractor[] featureExtractors; /** Constructor. */ public ComposedFeatureExtractor(FeatureExtractor[] featureExtractors) { this.featureExtractors = featureExtractors; } /** Binary constructor. */ public ComposedFeatureExtractor(FeatureExtractor featureExtractor1, FeatureExtractor featureExtractor2) { this.featureExtractors = new FeatureExtractor[]{ featureExtractor1, featureExtractor2 }; } /** Constructor for sign scorers, some of which may be feature extractors. */ public ComposedFeatureExtractor(SignScorer[] models) { ArrayList feList = new ArrayList(models.length); for (int i = 0; i < models.length; i++) { if (models[i] instanceof FeatureExtractor) feList.add((FeatureExtractor)models[i]); } this.featureExtractors = feList.toArray(new FeatureExtractor[feList.size()]); } /** Returns the features for the given sign and completeness flag. */ public FeatureVector extractFeatures(Sign sign, boolean complete) { FeatureVector[] featureVectors = new FeatureVector[featureExtractors.length]; for (int i=0; i < featureExtractors.length; i++) featureVectors[i] = featureExtractors[i].extractFeatures(sign, complete); return new ComposedFeatureVector(featureVectors); } /** Sets the alphabet. 
*/ public void setAlphabet(Alphabet alphabet) { for (FeatureExtractor fe : featureExtractors) { fe.setAlphabet(alphabet); } } } ================================================ FILE: src/opennlp/ccg/perceptron/ComposedFeatureVector.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.perceptron; /** * Class for composing feature vectors. * Features from the component feature vectors are assumed to be independent. * * @author Michael White * @version $Revision: 1.2 $, $Date: 2011/01/15 17:52:59 $ */ public class ComposedFeatureVector implements FeatureVector { /** The feature vectors. */ public final FeatureVector[] featureVectors; /** Constructor. */ public ComposedFeatureVector(FeatureVector[] featureVectors) { this.featureVectors = featureVectors; } /** Binary constructor. */ public ComposedFeatureVector(FeatureVector featureVector1, FeatureVector featureVector2) { this.featureVectors = new FeatureVector[]{ featureVector1, featureVector2 }; } /** Size. */ public int size() { int retval = 0; for (FeatureVector fv : featureVectors) retval += fv.size(); return retval; } /** Returns an iterator over the entries. */ public Iterator iterator() { if (featureVectors.length == 0) return EMPTY_ITERATOR; return new Iterator() { int i = 0; Iterator it = featureVectors[0].iterator(); public boolean hasNext() { if (it.hasNext()) return true; if (i == featureVectors.length-1) return false; it = featureVectors[++i].iterator(); return hasNext(); } public Alphabet.Feature nextFeature() { return it.nextFeature(); } public Float nextValue() { return it.nextValue(); } }; } } ================================================ FILE: src/opennlp/ccg/perceptron/EventFile.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2008-2013 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.perceptron; import java.util.*; import java.util.zip.*; import java.io.*; import opennlp.ccg.synsem.Sign; /** * An abstract representation of an event file, whose syntax is a more readable version * of what's used in the TADM toolkit. A constructor flag controls whether to keep the * events in memory (defaults to false). * * An event file may be given an alphabet, which allows features to be filtered to * just those present in the alphabet, when it's closed; otherwise, the * alphabet is constructed dynamically. * * The concrete syntax of an event file is as follows. * An event file consists of a sequence of blocks. * A block starts with the number of events on a line by itself. * It is followed by each event, one per line. * Each event line has a frequency, followed by the number of feature-value pairs, * then the sequence of feature-value pairs, * where the feature name is a string with no white space. * Each feature can appear only once in an event, and must have a value greater than zero. * You can have events with a zero frequency -- these are used for dispreferred analyses * in ranking tasks such as parse selection or realization ranking. * * An example file appears below. There are two blocks, corresponding to the * parses of two different senses. The first block has two possible parses, * the first of which is correct, while the second block has three possible * parses, where the second one is the correct one. * *
     * <pre>
     * 2
     * 1 2 feat1 1.22 feat2 3
     * 0 3 feat1 1.55 feat3 1 feat4 2.7
     * 3
     * 0 2 feat1 1.44 feat4 2.2
     * 1 1 feat1 1.33
     * 0 2 feat1 1.32 feat4 3.21
     * </pre>
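     * Reading the example above: the first block holds two events, the gold parse (frequency 1)
     * with features feat1=1.22 and feat2=3, and a dispreferred parse (frequency 0) with
     * features feat1=1.55, feat3=1 and feat4=2.7.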
    * * @author Michael White * @version $Revision: 1.5 $, $Date: 2009/11/01 22:26:29 $ */ public class EventFile { /** A block is a list of events. */ public static class Block { /** The list. */ public List events; /** Constructor. */ public Block(List events) { this.events = events; } /** The event with the highest count (first tied if ties). */ public Event best() { Event retval = null; int max = -1; for (Event event : events) { if (event.count > max) { retval = event; max = event.count; } } return retval; } } /** An event is a feature vector with a count. */ public static class Event { /** The count. */ public int count; /** The feature vector. */ public FeatureVector features; /** Constructor. */ public Event(FeatureVector features, int count) { this.features = features; this.count = count; } /** toString. */ public String toString() { return "event: count: " + count + " " + features; } } // the alphabet private Alphabet alphabet; // the file, which can be reopened private File file; // the current reader private Reader reader; // the current tokenizer private StreamTokenizer tokenizer; // the saved blocks, if kept in memory private List blocks = null; // the iterator over saved blocks private Iterator blockIt = null; // whether the end-of-file has been reached private boolean eofReached = false; /** Constructor with filename. */ public EventFile(String filename) throws IOException { this(filename, false); } /** Constructor with filename and in-memory flag. */ public EventFile(String filename, boolean inMemory) throws IOException { this(filename, new Alphabet(10000), inMemory); } /** Constructor with filename and alphabet. */ public EventFile(String filename, Alphabet alphabet) throws IOException { this(filename, alphabet, false); } /** Constructor with filename, alphabet and in-memory flag. */ public EventFile(String filename, Alphabet alphabet, boolean inMemory) throws IOException { file = new File(filename); init(); this.alphabet = alphabet; if (inMemory) this.blocks = new ArrayList(10000); } /** Returns the alphabet. */ public Alphabet getAlphabet() { return alphabet; } /** Closes the reader. */ public void close() throws IOException { reader.close(); } /** Resets the event file for reading again. */ public void reset() throws IOException { close(); init(); } // inits the reader and tokenizer, or // if keeping blocks in memory, resets the iterator private void init() throws IOException { // in-memory case if (blocks != null && eofReached) { blockIt = blocks.iterator(); return; } // degenerate case: keeping blocks in memory but eof not reached if (blocks != null) { // dump saved blocks blocks.clear(); } // regular init reader = openReader(file); tokenizer = initTokenizer(reader); } /** Initializes the given tokenizer to recognize most chars as word chars. */ public static StreamTokenizer initTokenizer(Reader reader) throws IOException { StreamTokenizer tokenizer = new StreamTokenizer(reader); tokenizer.resetSyntax(); tokenizer.wordChars(33, 255); tokenizer.whitespaceChars(0, 32); return tokenizer; } /** Returns whether EOF has been reached. */ public boolean endOfFile() throws IOException { tokenizer.nextToken(); boolean eof = (tokenizer.ttype == StreamTokenizer.TT_EOF); tokenizer.pushBack(); return eof; } /** Reads the next event. Feature are filtered if apropos. 
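 * For instance, the event line "1 2 feat1 1.22 feat2 3" from the class comment yields an
 * Event with count 1 and the two pairs feat1=1.22 and feat2=3; a feature missing from a
 * closed alphabet is silently dropped from the vector.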
*/ private Event nextEvent() throws IOException { tokenizer.nextToken(); int count = Integer.parseInt(tokenizer.sval); tokenizer.nextToken(); int numFeats = Integer.parseInt(tokenizer.sval); FeatureList fv = new FeatureList(numFeats); for (int i=0; i < numFeats; i++) { tokenizer.nextToken(); String feat = tokenizer.sval; tokenizer.nextToken(); float val = Float.parseFloat(tokenizer.sval); Alphabet.Feature f = alphabet.index(feat); if (f != null) fv.add(f, val); } return new Event(fv, count); } /** Reads the next block, or null if none. */ public Block nextBlock() throws IOException { // first check block iterator for in-mem case if (blockIt != null) { return (blockIt.hasNext()) ? blockIt.next() : null; } // otherwise check for eof, noting completion for in-mem case if (endOfFile()) { eofReached = true; return null; } // otherwise parse next block tokenizer.nextToken(); int numEvents = Integer.parseInt(tokenizer.sval); List events = new ArrayList(numEvents); for (int i=0; i < numEvents; i++) { events.add(nextEvent()); } Block retval = new Block(events); // save block with in-mem case if (blocks != null) blocks.add(retval); // done return retval; } /** Returns a reader for the given file, using gzip inflation if the file's name ends with .gz. */ public static Reader openReader(File file) throws IOException { if (file.getName().endsWith(".gz")) return new InputStreamReader(new GZIPInputStream(new FileInputStream(file))); else return new BufferedReader(new FileReader(file)); } /** Returns a printwriter for the given file, using gzip deflation if the file's name ends with .gz. */ public static PrintWriter openWriter(File file) throws IOException { if (file.getName().endsWith(".gz")) return new PrintWriter(new OutputStreamWriter(new GZIPOutputStream(new FileOutputStream(file)))); else return new PrintWriter(new BufferedWriter(new FileWriter(file))); } /** Writes the events for a given list of signs according to the feature extractor and best sign. */ public static void writeEvents(PrintWriter pw, List signs, Sign best, FeatureExtractor fe) throws IOException { Collections.shuffle(signs); pw.println(Integer.toString(signs.size())); for (Sign s : signs) { int count = 0; if (s == best) count = 1; pw.print(count + " "); FeatureVector fvect = fe.extractFeatures(s, true); int numfeats = fvect.size(); pw.print(numfeats + " "); for (FeatureVector.Iterator it = fvect.iterator(); it.hasNext(); ) { pw.print(it.nextFeature().name() + " " + it.nextValue() + " "); } pw.println(); } } } ================================================ FILE: src/opennlp/ccg/perceptron/FeatureExtractor.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2008 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.perceptron; import opennlp.ccg.synsem.*; /** * Interface for mappings signs to features. * * @author Michael White * @version $Revision: 1.5 $, $Date: 2009/06/22 04:32:50 $ */ public interface FeatureExtractor { /** Returns the features for the given sign and completeness flag. */ public FeatureVector extractFeatures(Sign sign, boolean complete); /** Sets the alphabet. */ public void setAlphabet(Alphabet alphabet); } ================================================ FILE: src/opennlp/ccg/perceptron/FeatureList.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2008 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.perceptron; import java.util.*; /** * A feature vector represented by a list of features and a list of values. * Features are assumed to be unique. * * @author Michael White * @version $Revision: 1.2 $, $Date: 2011/10/11 03:20:05 $ */ public class FeatureList implements FeatureVector { @SuppressWarnings("unused") private static final long serialVersionUID = 325935806787566283L; // features private ArrayList features; // values private ArrayList values; /** Default constructor. */ public FeatureList() { features = new ArrayList(); values = new ArrayList(); } /** Constructor with size. */ public FeatureList(int size) { features = new ArrayList(size); values = new ArrayList(size); } /** Constructor from feature vector. */ public FeatureList(FeatureVector fv) { for (Iterator it = fv.iterator(); it.hasNext(); ) add(it.nextFeature(), it.nextValue()); } /** Add feature-value pair. */ public void add(Alphabet.Feature feature, Float value) { features.add(feature); values.add(value); } /** Add feature vector (features assumed distinct). */ public void add(FeatureVector fv) { features.ensureCapacity(size() + fv.size()); values.ensureCapacity(size() + fv.size()); for (Iterator it = fv.iterator(); it.hasNext(); ) add(it.nextFeature(), it.nextValue()); } /** Get feature at index. */ public Alphabet.Feature getFeature(int index) { return features.get(index); } /** Get value at index. */ public Float getValue(int index) { return values.get(index); } /** Size. */ public int size() { return features.size(); } /** Iterator. */ public Iterator iterator() { return new Iterator() { java.util.Iterator itF = features.iterator(); java.util.Iterator itV = values.iterator(); public boolean hasNext() { return itF.hasNext(); } public Alphabet.Feature nextFeature() { return itF.next(); } public Float nextValue() { return itV.next(); } }; } /** toString. 
*/ public String toString() { String retval = "features: "; for (int i=0; i < features.size(); i++) retval += "<" + getFeature(i).name() + "," + getValue(i) + "> "; return retval; } } ================================================ FILE: src/opennlp/ccg/perceptron/FeatureMap.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2008 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.perceptron; import java.util.*; /** * A feature vector represented using a map. * * @author Michael White * @version $Revision: 1.9 $, $Date: 2011/10/11 03:20:06 $ */ public class FeatureMap implements FeatureVector { @SuppressWarnings("unused") private static final long serialVersionUID = -5054109887068464041L; // the map private HashMap map; /** Default constructor. */ public FeatureMap() { map = new LinkedHashMap(); } /** Constructor with size. */ public FeatureMap(int size) { map = new LinkedHashMap(size*2); } /** Constructor from feature vector. */ public FeatureMap(FeatureVector fv) { this(fv.size()*4); for (Iterator it = fv.iterator(); it.hasNext(); ) map.put(it.nextFeature(), it.nextValue()); } /** Constructor from two feature vectors. */ public FeatureMap(FeatureVector fv1, FeatureVector fv2) { this((fv1.size()+fv2.size())*3); for (Iterator it = fv1.iterator(); it.hasNext(); ) map.put(it.nextFeature(), it.nextValue()); add(fv2); } /** Increments a feature count. */ public void inc(Alphabet.Feature feature) { float count = 1; Float val = map.get(feature); if (val != null) count = Math.round(val) + 1; map.put(feature, count); } /** Adds to a feature's value (starting with zero). */ public void add(Alphabet.Feature feature, Float value) { Float val = map.get(feature); if (val != null) map.put(feature, val + value); else map.put(feature, value); } /** Adds a feature vector. */ public void add(FeatureVector fv) { for (Iterator it = fv.iterator(); it.hasNext(); ) add(it.nextFeature(), it.nextValue()); } /** Returns the feature's value (zero if not present). */ public float get(Alphabet.Feature feature) { Float retval = map.get(feature); return (retval != null) ? retval : 0; } /** Clears the map. */ public void clear() { map.clear(); } /** Size. */ public int size() { return map.size(); } /** Returns an iterator over the entries. 
*/ public Iterator iterator() { return new Iterator() { java.util.Iterator> it = map.entrySet().iterator(); Map.Entry entry = null; public boolean hasNext() { return it.hasNext(); } public Alphabet.Feature nextFeature() { entry = it.next(); return entry.getKey(); } public Float nextValue() { return entry.getValue(); } }; } } ================================================ FILE: src/opennlp/ccg/perceptron/FeatureVector.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2008 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.perceptron; /** * A sparse feature vector, with size and an iterator over feature-value pairs. * * @author Michael White * @version $Revision: 1.6 $, $Date: 2011/01/15 17:52:59 $ */ public interface FeatureVector { /** * Iterator over feature-value pairs. * Features and values must be retrieved using a pair of calls * to nextFeature and nextValue, otherwise the behavior is not defined. */ public interface Iterator { /** Whether any items remain. */ public boolean hasNext(); /** Returns the next feature. */ public Alphabet.Feature nextFeature(); /** Returns the next value. */ public Float nextValue(); } /** Size. */ public int size(); /** Iterator over feature-value pairs. */ public Iterator iterator(); /** Empty iterator. */ public static Iterator EMPTY_ITERATOR = new Iterator() { public boolean hasNext() { return false; } public Alphabet.Feature nextFeature() { return null; } public Float nextValue() { return null; } }; } ================================================ FILE: src/opennlp/ccg/perceptron/Model.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2008 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.perceptron; import java.util.*; import java.io.*; import opennlp.ccg.perceptron.Alphabet.Feature; import opennlp.ccg.util.Pair; /** * A model is a vector of weights for an alphabet. * * A model can be read from a file, which starts with the number * of features on one line, followed by one line per feature pairing * the feature name with its weight. * * A new model with all zero weights can also be created from an alphabet. * * The main routine tests the model on an event file. * * @author Michael White * @version $Revision: 1.7 $, $Date: 2009/11/09 18:54:30 $ */ public class Model { /** Filter interface for adjusting feature weights when loading a model. */ public interface FeatureFilter { /** Returns the modified feature weight for the given feature. */ public double adjustedWeight(String name, double weight); } /** Flag for whether to print debugging info to System.err. */ public boolean debug = false; // weight vector private double[] weights; // alphabet private Alphabet alphabet; /** Constructor with alphabet, for a new model with all zero weights. */ public Model(Alphabet alphabet) { this.alphabet = alphabet; weights = new double[alphabet.size()]; zero(); } /** Constructor to load a model from a file. The alphabet is set to closed. */ public Model(String filename) throws IOException { this(filename, null); } /** * Constructor to load a model from a file using a feature filter. The * alphabet is set to closed. */ public Model(String filename, FeatureFilter filter) throws IOException { Reader reader = EventFile.openReader(new File(filename)); StreamTokenizer tokenizer = EventFile.initTokenizer(reader); tokenizer.nextToken(); int size = Integer.parseInt(tokenizer.sval); alphabet = new Alphabet(size); weights = new double[size]; for (int i = 0; i < size; i++) { tokenizer.nextToken(); String name = tokenizer.sval; tokenizer.nextToken(); double weight = Double.parseDouble(tokenizer.sval); if (filter != null) weight = filter.adjustedWeight(name, weight); alphabet.add(name); weights[i] = weight; } reader.close(); alphabet.setClosed(true); } /** Returns the size of the model. */ public int size() { return weights.length; } /** Returns the alphabet. */ public Alphabet getAlphabet() { return alphabet; } /** Returns the weight for the given index. */ public double getWeight(int index) { return weights[index]; } /** Returns the weight for the given feature. */ public double getWeight(String feat) { return weights[alphabet.index(feat).getIndex()]; } /** Returns the weight for the given feature. */ public double getWeight(Alphabet.Feature f) { return weights[f.getIndex()]; } /** Sets the weight for the given index. */ public void setWeight(int index, double weight) { weights[index] = weight; } /** Sets the weight for the given feature. */ public void setWeight(String feat, double weight) { weights[alphabet.index(feat).getIndex()] = weight; } /** Sets the weight for the given feature. */ public void setWeight(Alphabet.Feature f, double weight) { weights[f.getIndex()] = weight; } /** Returns the dot product of the weights and features. 
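 * That is, score(fv) is the sum over the vector's feature-value pairs (f, v) of weight(f) * v,
 * where pairs whose feature has no index in the alphabet contribute nothing. For an
 * illustrative model with weights featA=0.5 and featB=-2.0, the vector {featA=2, featB=1}
 * scores 0.5*2 + (-2.0)*1 = -1.0.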
*/ public double score(FeatureVector fv) { double retval = 0.0; for (FeatureVector.Iterator it = fv.iterator(); it.hasNext(); ) { Feature feat = it.nextFeature(); Float value = it.nextValue(); Integer index = feat.getIndex(); if (index == null) continue; retval += weights[index] * value; } if (debug) System.err.println("score: " + retval + " " + fv); return retval; } /** Adds the feature vector values to the weights. */ public void add(FeatureVector fv) { for (FeatureVector.Iterator it = fv.iterator(); it.hasNext(); ) { Feature feat = it.nextFeature(); Float value = it.nextValue(); Integer index = feat.getIndex(); if (index == null) continue; weights[index] += value; } } /** Subtracts the feature vector values from the weights. */ public void subtract(FeatureVector fv) { for (FeatureVector.Iterator it = fv.iterator(); it.hasNext(); ) { Feature feat = it.nextFeature(); Float value = it.nextValue(); Integer index = feat.getIndex(); if (index == null) continue; weights[index] -= value; } } /** Adds the given model's weights to this model. The models are assumed to share the same alphabet. */ public void add(Model model) { for (int i=0; i < weights.length; i++) { weights[i] += model.weights[i]; } } /** Multiplies the weights by the given number. */ public void multiply(double num) { for (int i=0; i < weights.length; i++) { weights[i] *= num; } } /** Resets the weights to zero. */ public void zero() { for (int i=0; i < weights.length; i++) { weights[i] = 0.0; } } /** Sets this model's weights to the given model's ones, where the alphabets intersect. */ public void set(Model model) { zero(); for (int i=0; i < model.weights.length; i++) { Alphabet.Feature f = model.alphabet.feature(i); Alphabet.Feature f0 = alphabet.index(f); if (f0 == null || f0.getIndex() == null) continue; weights[f0.getIndex()] = model.weights[i]; } } /** Returns the best event (first tied if ties). */ public FeatureVector best(List fvs) { FeatureVector retval = null; double max = Double.NEGATIVE_INFINITY; for (FeatureVector fv : fvs) { double score = score(fv); if (score > max) { retval = fv; max = score; } } return retval; } /** Returns the best event (first tied if ties). */ public EventFile.Event best(EventFile.Block block) { EventFile.Event retval = null; double max = Double.NEGATIVE_INFINITY; for (EventFile.Event event : block.events) { double score = score(event.features); if (score > max) { retval = event; max = score; } } return retval; } /** Returns the accuracy on the event file. */ public double accuracy(EventFile eventFile) throws IOException { if (alphabet != eventFile.getAlphabet()) { throw new RuntimeException("Model and EventFile must share the same alphabet!"); } int correct = 0; int total = 0; EventFile.Block block; while ( (block = eventFile.nextBlock()) != null ) { total++; if (best(block) == block.best()) { correct++; if (debug) System.err.println("CORRECT"); } else { if (debug) System.err.println("WRONG; best: " + block.best()); } } if (debug) System.err.println("correct: " + correct + " total: " + total); return 1.0 * correct / total; } /** Saves the model to a file, filtering out zero weights. */ public void save(String filename) throws IOException { save(filename, 0.0); } /** Saves the model to a file, filtering out weights whose absolute value does not exceed the pruning value. 
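 * The output uses the same layout that the Model(String) constructor reads back in: the number
 * of surviving features on the first line, then one "name weight" line per feature, sorted by
 * descending absolute weight.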
*/ public void save(String filename, double minPrune) throws IOException { File file = new File(filename); PrintWriter out = EventFile.openWriter(file); // calc pruned size int size = size(); int pruned = 0; for (int i=0; i < size; i++) if (Math.abs(weights[i]) <= minPrune) pruned++; int prunedSize = size - pruned; // write pruned size out.println(Integer.toString(prunedSize)); // collect unpruned weights List> featWeights = new ArrayList>(prunedSize); for (int i=0; i < size; i++) { if (Math.abs(weights[i]) <= minPrune) continue; featWeights.add(new Pair(alphabet.feature(i), weights[i])); } // sort weights by descending absolute value // (further sorting alphabetically may take too long) Collections.sort( featWeights, new Comparator>() { public int compare(Pair entry1, Pair entry2) { double val1 = Math.abs(entry1.b); double val2 = Math.abs(entry2.b); if (val1 > val2) return -1; if (val1 < val2) return 1; return 0; //return entry1.a.name().compareTo(entry2.a.name()); } } ); // write sorted weights for (Pair fw : featWeights) { out.println(fw.a.name() + " " + fw.b); } out.close(); } /** * Loads a model from a file and tests it on the given event file. */ public static void main(String[] args) throws IOException { // help if (args.length < 2) { System.out.println("Usage: java perceptron.Model (-debug)"); System.exit(0); } // args String modelfile = args[0]; String eventfile = args[1]; boolean debug = Arrays.asList(args).contains("-debug"); // load model System.out.println("Loading model from: " + modelfile); Model model = new Model(modelfile); model.debug = debug; System.out.println("model size: " + model.size()); System.out.println("debug: " + debug); // compute accuracy System.out.println("Scoring events in: " + eventfile); EventFile eventFile = new EventFile(eventfile, model.alphabet); double accuracy = model.accuracy(eventFile); System.out.println("accuracy: " + accuracy); } } ================================================ FILE: src/opennlp/ccg/perceptron/PerceptronScorer.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2008 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.perceptron; import opennlp.ccg.synsem.*; /** * A sign scorer for a perceptron model. * * @author Michael White * @version $Revision: 1.7 $, $Date: 2011/03/21 20:46:43 $ */ public class PerceptronScorer implements SignScorer { /** The feature extractor. */ public final FeatureExtractor featureExtractor; /** The model. */ public final Model model; /** Constructor. 
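 * A typical (purely illustrative) setup pairs a feature extractor with a trained model file,
 * e.g. new PerceptronScorer(myFeatureExtractor, new Model("parser.model.gz")); the constructor
 * then hands the model's alphabet to the extractor via setAlphabet.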
*/ public PerceptronScorer(FeatureExtractor featureExtractor, Model model) { this.featureExtractor = featureExtractor; this.model = model; featureExtractor.setAlphabet(model.getAlphabet()); } /** * Returns a score for the given sign and completeness flag, where higher * numbers are better than lower numbers. * In particular, returns the score assigned by the model to the features * extracted from the given sign with the given completeness flag. */ public double score(Sign sign, boolean complete) { return model.score(featureExtractor.extractFeatures(sign, complete)); } } ================================================ FILE: src/opennlp/ccg/perceptron/ReRankingPerceptronScorer.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2011 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.perceptron; import opennlp.ccg.synsem.*; /** * A re-ranking sign scorer for a perceptron model. * Note that at present, n-best re-ranking has been found to work better * for parsing, but not for realization, where forest re-ranking (ie using * the perceptron scorer throughout) seems to work better. * * @author Michael White * @version $Revision: 1.1 $, $Date: 2011/03/21 20:46:32 $ */ public abstract class ReRankingPerceptronScorer extends PerceptronScorer implements ReRankingScorer { /** Flag for whether to use the full model. */ protected boolean useFullModel = false; /** Sets the full model flag. */ public void setFullModel(boolean on) { useFullModel = on; } /** The base scorer, for use when the full model is turned off. */ protected SignScorer baseScorer; /** Returns the base scorer, using the given feature extractor if desired. */ abstract protected SignScorer getBaseScorer(FeatureExtractor featureExtractor); /** Constructor that configures the base scorer using getBaseScorer. */ public ReRankingPerceptronScorer(FeatureExtractor featureExtractor, Model model) { super(featureExtractor, model); baseScorer = getBaseScorer(featureExtractor); } /** Scores the sign with the full or base model, according to the full model flag. 
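Since getBaseScorer is called from the constructor above, a concrete subclass only needs to supply a base scorer. A minimal sketch, assuming the ReRankingScorer interface requires nothing beyond what the abstract class already implements; the do-nothing base scorer here is purely illustrative, whereas a real plugin would typically return an n-gram scorer built over the same feature extractor:

    public class MyReRankingScorer extends ReRankingPerceptronScorer {
        public MyReRankingScorer(FeatureExtractor extractor, Model model) {
            super(extractor, model);
        }
        protected SignScorer getBaseScorer(FeatureExtractor extractor) {
            // trivial base model: scores every sign the same
            return new SignScorer() {
                public double score(Sign sign, boolean complete) { return 0.0; }
            };
        }
    }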
*/ public double score(Sign sign, boolean complete) { if (useFullModel) return super.score(sign, complete); else return baseScorer.score(sign, complete); } } ================================================ FILE: src/opennlp/ccg/perceptron/Trainer.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2008-2013 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.perceptron; //import java.util.*; import java.io.*; /** * Trains an averaged perceptron model by iterating through an event file. * * The main routine trains and saves a model. Options include saving * the final, non-averaged model, and saving the averaged model after * every N iterations. There's also an option to keep the events in * memory for subsequent iterations. * * An alphabet must be supplied as input. The main routine of the * Alphabet class can be used to derive an alphabet from a training * file. * * @author Michael White * @version $Revision: 1.4 $, $Date: 2009/06/18 23:38:57 $ */ public class Trainer { /** The training file. */ public final String trainfile; /** The alphabet. */ public final Alphabet alphabet; /** The number of training iterations. */ public final int iterations; /** The model file. */ public final String modelfile; /** The in-memory flag. */ public final boolean inMemory; /** The current model. */ public final Model currentModel; /** The averaged model. */ public final Model averagedModel; /** The model for averaging over the current iteration. */ private Model iterationModel; /** The number of iterations to use when saving every N iterations. */ private int saveEveryNth = 0; /** Constructor. */ public Trainer(String trainfile, String alphabetfile, int iterations, String modelfile, boolean inMemory) throws IOException { this.trainfile = trainfile; this.alphabet = new Alphabet(alphabetfile); this.iterations = iterations; this.modelfile = modelfile; this.inMemory = inMemory; this.currentModel = new Model(alphabet); this.averagedModel = new Model(alphabet); this.iterationModel = new Model(alphabet); } /** Initializes the model. */ public void initModel(String initmodelfile) throws IOException { Model model = new Model(initmodelfile); currentModel.set(model); averagedModel.set(model); } /** Train the model, reporting accuracy of the averaged model for each iteration and the final model. 
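Concretely, the averaging in train() below maintains avgModel_i = (i/(i+1)) * avgModel_(i-1) + iterationSum_i / (total * (i+1)), where iterationSum_i is the sum of the per-event snapshots of the current model taken during iteration i, so the averaged model stays equal to the mean of all total * (i+1) snapshots seen so far. For example, with total = 100 events, after the second iteration (i = 1) the previous average (over 100 snapshots) is scaled by 1/2 and the new sum of 100 snapshots by 1/200, giving the mean over all 200 snapshots.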
*/ public void train() throws IOException { // open training file EventFile eventFile = new EventFile(trainfile, alphabet, inMemory); // iterate boolean converged = false; for (int i=0; i < iterations; i++) { System.out.println("iteration: " + i); // reset training file eventFile.reset(); // zero iteration model iterationModel.zero(); // init counters int updates = 0; int correct = 0; int total = 0; EventFile.Block block; // go through training file while ( (block = eventFile.nextBlock()) != null ) { total++; // update if wrong EventFile.Event modelBest = currentModel.best(block); EventFile.Event actualBest = block.best(); if (modelBest != actualBest) { updates++; currentModel.add(actualBest.features); currentModel.subtract(modelBest.features); } // see if averaged model correct EventFile.Event avgModelBest = averagedModel.best(block); if (avgModelBest == actualBest) correct++; // update iteration model iterationModel.add(currentModel); } // divide iteration model by total to yield an average for this iteration, // and divide by iteration number (+1) to yield proportion of this // iteration to averaged model; combine these two steps into one call double denominator = 1.0 * total * (i+1); iterationModel.multiply(1.0 / denominator); // multiply averaged model by i/(i+1) for proportion of previous iterations if (i > 0) { double mult = 1.0 * i / (i+1); averagedModel.multiply(mult); } // updated averaged model averagedModel.add(iterationModel); // report System.out.println("updates: " + updates); System.out.println("avg model correct: " + correct + " total: " + total + " accuracy: " + (1.0 * correct / total)); System.out.println(); if (updates == 0) { System.out.println("converged"); System.out.println(); converged = true; break; } // save every nth if (saveEveryNth > 0 && i < (iterations-1) && i % saveEveryNth == 0) { String nthModelfile = nthFilename(modelfile, i); System.out.println("Saving model to " + nthModelfile); averagedModel.save(nthModelfile); System.out.println(); } } // do one more iteration to compute accuracy if not converged if (!converged) { System.out.println("final iteration: "); // reset training file eventFile.reset(); // init counters int finalCorrect = 0; int correct = 0; int total = 0; EventFile.Block block; // go through training file while ( (block = eventFile.nextBlock()) != null ) { total++; // see if correct EventFile.Event modelBest = currentModel.best(block); EventFile.Event avgModelBest = averagedModel.best(block); EventFile.Event actualBest = block.best(); if (modelBest == actualBest) finalCorrect++; if (avgModelBest == actualBest) correct++; } // report System.out.println("final model correct: " + finalCorrect + " total: " + total + " accuracy: " + (1.0 * finalCorrect / total)); System.out.println("avg model correct: " + correct + " total: " + total + " accuracy: " + (1.0 * correct / total)); System.out.println(); } // close training file eventFile.close(); } /** Returns a filename with .N added before the extension, if any. */ public static String nthFilename(String filename, int N) { int lastdot = filename.lastIndexOf('.'); if (lastdot > 0) return filename.substring(0,lastdot) + "." + N + filename.substring(lastdot); else return filename + "." + N; } /** * Trains an averaged perceptron model from the training file using the alphabet file and the given * number of iterations, saving the file to model file. * The final (non-averaged) model can optionally be saved using the -f option, * and intermediate models can be saved every N iterations using the -n option. 
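Putting the positional arguments and options together (reconstructed from the argument handling in main below), a typical invocation is:

    java perceptron.Trainer <traineventfile> <alphabetfile> <iterations> <modelfile> (-i <initmodelfile>) (-f <finalmodelfile>) (-n <N>) (-in_mem)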
* The -in_mem option keeps the events in memory for subsequent iterations. */ public static void main(String[] args) throws IOException { // help if (args.length < 4) { System.out.println( "Usage: java perceptron.Trainer " + "(-i ) (-f ) (-n ) (-in_mem)" ); System.exit(0); } // args String traineventfile = args[0]; String alphabetfile = args[1]; int iterations = Integer.parseInt(args[2]); String modelfile = args[3]; String initmodelfile = null; String finalmodelfile = null; int saveEveryNth = 0; boolean inMemory = false; for (int i=4; i < args.length; i++) { if (args[i].equals("-i")) initmodelfile = args[++i]; if (args[i].equals("-f")) finalmodelfile = args[++i]; if (args[i].equals("-n")) saveEveryNth = Integer.parseInt(args[++i]); if (args[i].equals("-in_mem")) inMemory = true; } // setup, train System.out.println("Training on " + traineventfile + " using " + alphabetfile + " for " + iterations + " iterations"); if (initmodelfile != null) System.out.println("with " + initmodelfile + " as the initial model"); if (inMemory) System.out.println("keeping events in memory"); System.out.println(); Trainer trainer = new Trainer(traineventfile, alphabetfile, iterations, modelfile, inMemory); if (initmodelfile != null) trainer.initModel(initmodelfile); trainer.saveEveryNth = saveEveryNth; trainer.train(); // save model System.out.println("Saving model to " + modelfile); trainer.averagedModel.save(modelfile); if (finalmodelfile != null) { System.out.println("Saving model to " + finalmodelfile); trainer.currentModel.save(finalmodelfile); } } } ================================================ FILE: src/opennlp/ccg/realize/Chart.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-11 University of Edinburgh / Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.realize; import opennlp.ccg.*; import opennlp.ccg.synsem.*; import opennlp.ccg.util.Pair; import opennlp.ccg.ngrams.NgramPrecisionModel; import opennlp.ccg.parse.DerivationHistory; import opennlp.ccg.hylo.*; import java.io.*; import java.util.*; import java.util.prefs.*; import gnu.trove.*; /** * The chart manages the creation of edges. Newly added edges are kept on an * agenda prior to rule applications. In the anytime mode, the chart completion * process can be interrupted according to the given parameters and preferences * (see Chart.combine). In the packing mode, completing the chart produces * a packed representation, which may then be unpacked if the DO_UNPACKING * preference is set. * * A single chart instance per realization request is assumed. 
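A minimal sketch of how a realization request drives this class, assuming the edge factory and pruning strategy are supplied by the surrounding realizer:

    Chart chart = new Chart(edgeFactory, pruningStrategy);
    chart.initialize();                        // seed the agenda with initial edges from lex lookup
    chart.combine(Chart.NO_TIME_LIMIT, false); // combine edges until the agenda is empty
    chart.printBestEdge();                     // print the best (preferably complete) realization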
* * @author Michael White * @version $Revision: 1.79 $, $Date: 2011/08/28 04:05:39 $ */ public class Chart { /** Preference key for time limit on edge combination. */ public static final String TIME_LIMIT = "Time Limit"; /** Preference key for time limit on finding a new best complete realization. If between o-1, the time limit is interpreted as a percentage of the time until the first realization is found. */ public static final String NEW_BEST_TIME_LIMIT = "New Best Time Limit"; /** A constant indicating no time limit on edge combination. */ public static final int NO_TIME_LIMIT = 0; /** Preference key for edge limit on edge combination. */ public static final String EDGE_LIMIT = "Edge Limit"; /** A constant indicating no edge limit on edge combination. */ public static final int NO_EDGE_LIMIT = 0; /** Preference key for pruning the number of signs kept per equivalence class. */ public static final String PRUNING_VALUE = "Pruning Value"; /** Preference key for pruning the number of signs kept per cell. */ public static final String CELL_PRUNING_VALUE = "Cell Pruning Value"; /** A constant indicating no pruning of signs per equivalence class. */ public static final int NO_PRUNING = 0; /** Preference key for whether to collect category combinations. */ public static final String USE_COMBOS = "Use Combos"; /** Preference key for whether to create a packed generation forest in the first of two realization stages (deferring unpacking to the later stage). This option pre-empts the use of collected combos in a single, anytime realization stage. */ public static final String USE_PACKING = "Use Packing"; /** Preference key for whether to unpack a generation forest in the second of two realization stages. This option is only relevant if packing is used in the first stage. */ public static final String DO_UNPACKING = "Do Unpacking"; /** The edge factory for the realization request. */ public final EdgeFactory edgeFactory; /** The pruning strategy. */ public final PruningStrategy pruningStrategy; /** Flag for whether to use depth-first search. Defaults to false. */ public boolean depthFirst = false; /** New best time limit, in ms. Set from prefs in constructor. */ public int newBestTimeLimit = NO_TIME_LIMIT; /** New best time limit, as a percentage of time from the first complete realization. Set from prefs in constructor. */ public double newBestTimeLimitPct = NO_TIME_LIMIT; /** Edge limit. Set from prefs in constructor. */ public int edgeLimit = NO_EDGE_LIMIT; /** Pruning value. Set from prefs in constructor. */ public int pruningValue = NO_PRUNING; /** Cell pruning value. Set from prefs in constructor. */ public int cellPruningValue = NO_PRUNING; /** Flag for whether to collect category combos. Set from prefs in constructor. */ public boolean collectCombos = true; /** Flag for whether to use packing. Set from prefs in constructor. */ public boolean usePacking = false; /** Flag for whether to do unpacking. Set from prefs in constructor. */ public boolean doUnpacking = true; /** Flag for whether to join best fragments if no complete realization found. Defaults to false. */ public boolean joinFragments = false; /** Flag for whether to glue fragments currently. Defaults to false. 
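These settings are read from the user preferences node for the TextCCG package in the constructor below, so they can be adjusted programmatically before a chart is constructed; a sketch with illustrative values:

    Preferences prefs = Preferences.userNodeForPackage(TextCCG.class);
    prefs.putBoolean(Chart.USE_PACKING, true);  // first stage: build a packed forest
    prefs.putBoolean(Chart.DO_UNPACKING, true); // second stage: unpack the forest
    prefs.putInt(Chart.PRUNING_VALUE, 5);       // keep at most 5 signs per equivalence class
    prefs.putInt(Chart.EDGE_LIMIT, 10000);      // stop combining after 10000 edges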
*/ public boolean gluingFragments = false; // the agenda of edges that have yet to be added to the chart private List agenda = new ArrayList(); // the (representative) edges in the chart private List edges = new ArrayList(); // all unpruned (and unpacked, if apropos) edges in the chart private List allEdges = new ArrayList(); // edges to be removed from the chart, after having been superceded // by an edge with an equivalent sign (up to surface words) and // a less complex derivation private List supercededEdgesPendingRemoval = new ArrayList(); // maps signs to edges (w/o optional bits marked as covered) private Map signMap = new IdentityHashMap(); // the edges seen so far private EdgeHash edgeHash = new EdgeHash(); // maps edges to representative edges, according to their // coverage vectors and their cats, sans LFs @SuppressWarnings("unchecked") private Map catMap = new THashMap( new TObjectHashingStrategy() { private static final long serialVersionUID = 1L; public int computeHashCode(Object o) { Edge edge = (Edge) o; return edge.bitset.hashCode() + edge.sign.getCategory().hashCodeNoLF(); } public boolean equals(Object o1, Object o2) { Edge edge1 = (Edge) o1; Edge edge2 = (Edge) o2; return edge1.bitset.equals(edge2.bitset) && edge1.sign.getCategory().equalsNoLF(edge2.sign.getCategory()); } } ); // cell map: based on input coverage vectors private Map cellMap = new HashMap(); // non-empty cells: cells to avoid when gluing fragments private Set nonEmptyCells = null; // reusable bitset for checking non-empty cells private transient BitSet tmpBitSet = new BitSet(); /** * The best edge found so far (or null), * where a complete edge is always given preference * to an incomplete one. */ public Edge bestEdge = null; /** The best edge created by joining fragments, if necessary. */ public Edge bestJoinedEdge = null; /** Whether the realization search has been completed. */ public boolean done = false; /** The number of nominals in the input LF. */ public int numNominals = 0; /** The number of elementary predications in the input LF. */ public int numPreds = 0; /** The number of edges created and added to the agenda. */ public int numEdges = 0; /** The number of pruned edges removed from the chart. */ public int numPrunedRemoved = 0; /** The number of pruned edges never added to the chart. */ public int numPrunedNeverAdded = 0; /** The number of new complete best edges found after the first one. */ public int newBest = 0; /** The maximum number of edges in a cell. */ public int cellMax = 0; /** The time at which realization started. */ protected long startTime = System.currentTimeMillis(); /** The time in ms until lex lookup was completed. */ public int timeTilLex = 0; /** The time in ms until the first complete edge was found. */ public int timeTilFirst = 0; /** The time in ms until the best edge was found. */ public int timeTilBest = 0; /** The time in ms until the search was stopped. */ public int timeTilStopped = 0; /** The time in ms until the packed chart was completed. */ public int timeTilPacked = 0; /** The time in ms until the search was finished. */ public int timeTilDone = 0; /** * Constructor with explicit pruning strategy. */ // * NB: Even with a non-default pruning strategy, it could potentially help // * to set the pruning value to an estimate of the number of // * edges per equivalent category that will be stored. 
public Chart(EdgeFactory edgeFactory, PruningStrategy pruningStrategy) { this.edgeFactory = edgeFactory; this.pruningStrategy = pruningStrategy; Preferences prefs = Preferences.userNodeForPackage(TextCCG.class); newBestTimeLimitPct = prefs.getDouble(NEW_BEST_TIME_LIMIT, NO_TIME_LIMIT); if (newBestTimeLimitPct >= 1) { newBestTimeLimit = (int) newBestTimeLimitPct; newBestTimeLimitPct = NO_TIME_LIMIT; } edgeLimit = prefs.getInt(EDGE_LIMIT, NO_EDGE_LIMIT); pruningValue = prefs.getInt(PRUNING_VALUE, NO_PRUNING); cellPruningValue = prefs.getInt(CELL_PRUNING_VALUE, NO_PRUNING); usePacking = prefs.getBoolean(USE_PACKING, false); collectCombos = !usePacking && prefs.getBoolean(USE_COMBOS, true); doUnpacking = usePacking && prefs.getBoolean(DO_UNPACKING, true); } /** Returns the number of (representative) edges in the chart. */ public int numEdgesInChart() { return edges.size(); } /** Returns the number of unpruned (and unpacked, if apropos) edges in the chart. */ public int numUnprunedEdges() { return allEdges.size(); } //----------------------------------------------------------------- // main algorithm routines /** Initializes the agenda. */ public void initialize() { // record number of nominals numNominals = edgeFactory.nominals.size(); numPreds = edgeFactory.preds.size(); // create various initial edges and add to the agenda for (Edge edge : edgeFactory.createInitialEdges()) addEdgeToAgenda(edge); // record time 'til lex long currentTime = System.currentTimeMillis(); timeTilLex = (int) (currentTime - startTime); } /** Returns whether there were no uncovered lexical or featural preds after lex lookup. */ public boolean noUncoveredPreds() { return !edgeFactory.hasUncoveredPreds; } /** * Reinitializes the agenda for gluing fragments. * A runtime exception is thrown if not in packing mode. */ public void reInitForGluing() { // check packing mode if (!usePacking) throw new RuntimeException("Packing mode required for gluing fragments."); // set flags here and in edge factory gluingFragments = true; edgeFactory.gluingFragments = true; edgeFactory.useIndexing = false; // add opt for uncovered preds, unless already done for relaxed relation matching if (!edgeFactory.useRelaxedRelationMatching) edgeFactory.addLFOptsForUncoveredPreds(); // add opts for rule instances edgeFactory.addLFOptsForRuleInstances(); // record non-empty cells nonEmptyCells = new HashSet(cellMap.keySet()); // add edges back to agenda, for possible gluing for (Edge edge : edges) addEdgeToAgenda(edge); } /** * Adds to the chart by iteratively moving an edge from the agenda to the chart, * creating new edges for the agenda by applying available rules, * while updating the best edge found so far, * until a stopping criterion is reached. * The basic stopping criterion is when the agenda becomes empty, and thus the * search is done. * Otherwise, the search is stopped either when the edge limit (if any) is reached, * or the time limit (if any) is reached, * or the first complete edge is found (if beyond the edge/time limit, and according to the given flag), * or until the new best time limit (if any; anytime case only) beyond the first * complete realization is exceeded. * In the packing case, unpacking is then performed according to the preference setting. 
* In the anytime case, if the collect combos option is set, then the combinatory rules * are only invoked when an edge with a new category is moved to the chart, in which case * any successful combinations are collected in the edge's combos data structure; * if the edge instead has an already seen category, new edges are created as * alternatives to the collected combos in its representative, much as with unpacking. */ public void combine(int timeLimitMS, boolean waitForCompleteEdge) { // until agenda is empty while (!agenda.isEmpty()) { // check for timeout long currentTime = System.currentTimeMillis(); int timeSoFar = (int) (currentTime - startTime); int timeSinceFirst = timeSoFar - timeTilFirst; boolean bestEdgeComplete = (bestEdge != null && bestEdge.complete()); if ( // edge limit case (edgeLimit != NO_EDGE_LIMIT && numEdges > edgeLimit && (!waitForCompleteEdge || bestEdgeComplete)) || // timeout case (timeLimitMS != NO_TIME_LIMIT && timeSoFar > timeLimitMS && (!waitForCompleteEdge || bestEdgeComplete)) || // new best timeout case (anytime only) (!usePacking && bestEdgeComplete && ((newBestTimeLimit != NO_TIME_LIMIT && timeSinceFirst > newBestTimeLimit) || (newBestTimeLimitPct != NO_TIME_LIMIT && (double) timeSinceFirst / timeTilFirst > newBestTimeLimitPct))) ) { // ensure best edge in chart if (!allEdges.contains(bestEdge)) { addEdgeToChart(bestEdge); } // set timing timeTilStopped = timeSoFar; // stop break; } // take edge from agenda Edge next = agenda.remove(0); // add edge to chart boolean actuallyAdded = addEdgeToChart(next); // skip if edge didn't survive pruning (anytime case), // or was folded into an existing edge (packing case) if (!actuallyAdded) { continue; } // otherwise do combos doEdgeCombos(next); } // set done packing time if (usePacking) { long donePackingTime = System.currentTimeMillis(); timeTilPacked = (int) (donePackingTime - startTime); // do unpacking, if apropos if (doUnpacking) doUnpacking(); } // set done flag, timing done = agenda.isEmpty(); if (done) { long endTime = System.currentTimeMillis(); timeTilDone = (int) (endTime - startTime); } // join best fragments, if nec. if (joinFragments && !bestEdge.complete()) joinBestFragments(); } // does binary combinations with all edges in the chart and unary ones too; // when collecting combos, invokes the combinatory rules only when nec.; // prunes superceded edges before returning private void doEdgeCombos(Edge next) { // skip semantically null edges when gluing fragments if (gluingFragments && next.bitset.isEmpty()) return; // when collecting combos ... if (collectCombos) { // existing rep case: just make alt edges from collected combos Edge nextRep = catMap.get(next); if (next != nextRep) { addNewEdges(edgeFactory.createAltEdges(next, nextRep)); // and prune any superceded edges before returning pruneSupercededEdges(); return; } } // otherwise combine edge with those in chart List edgesToUse = (usePacking || collectCombos) ? 
edges : allEdges; for (Edge edge : edgesToUse) { if (edge == next) continue; // skip this edge // skip fragment gluing if semantically null or if result cell non-empty if (gluingFragments) { if (edge.bitset.isEmpty()) continue; tmpBitSet.clear(); tmpBitSet.or(edge.bitset); tmpBitSet.or(next.bitset); if (nonEmptyCells.contains(tmpBitSet)) continue; } // add new combos to agenda addNewEdges(edgeFactory.createNewEdges(edge, next, collectCombos)); } // combine edge via unary rules and with semantically null edges, // adding new edges to the agenda addNewEdges(edgeFactory.createNewEdges(next, collectCombos)); // prune any superceded edges before returning pruneSupercededEdges(); } // adds all new edges to the agenda private void addNewEdges(List newEdges) { for (Edge newEdge : newEdges) { addEdgeToAgenda(newEdge); } } /** Greedily combines best fragments, updating bestJoinedEdge. */ protected void joinBestFragments() { // start with best edge bestJoinedEdge = bestEdge; // greedily find best fragments List fragments = new ArrayList(); BitSet bitset = bestEdge.bitset; while (true) { Edge bestFrag = null; for (Edge edge : allEdges) bestFrag = chooseBestFrag(bitset, bestFrag, edge); for (Edge edge : agenda) bestFrag = chooseBestFrag(bitset, bestFrag, edge); if (bestFrag == null) break; fragments.add(bestFrag); bitset = (BitSet) bitset.clone(); bitset.or(bestFrag.bitset); } // greedily join while (fragments.size() > 0) { Edge nextJoinedEdge = null; Edge nextFrag = null; for (Edge edge : fragments) { Edge joinedEdge = edgeFactory.makeJoinedEdge(bestJoinedEdge, edge); if (nextJoinedEdge == null || nextJoinedEdge.score < joinedEdge.score) { nextJoinedEdge = joinedEdge; nextFrag = edge; } Edge joinedEdgeR = edgeFactory.makeJoinedEdge(edge, bestJoinedEdge); if (nextJoinedEdge.score < joinedEdgeR.score) { nextJoinedEdge = joinedEdgeR; nextFrag = edge; } } bestJoinedEdge = nextJoinedEdge; fragments.remove(nextFrag); } } // returns edge as the new best frag if it doesn't intersect bitset // and has a better completeness or better score with same completeness; // otherwise returns bestFrag private Edge chooseBestFrag(BitSet bitset, Edge bestFrag, Edge edge) { if (edge.bitset.isEmpty() || edge.bitset.intersects(bitset)) return bestFrag; if (bestFrag == null) return edge; if (bestFrag.completeness < edge.completeness) return edge; if (bestFrag.completeness == edge.completeness && bestFrag.score < edge.score) return edge; return bestFrag; } //----------------------------------------------------------------- // unpacking /** Unpack complete edges, if any; otherwise unpack all. 
*/ protected void doUnpacking() { @SuppressWarnings("unchecked") Set unpacked = new THashSet(new TObjectIdentityHashingStrategy()); boolean foundComplete = bestEdge.complete(); // unpack each relevant edge, updating best edge for (Edge edge : edges) { if (foundComplete && !edge.complete()) continue; unpack(edge, unpacked); updateBestEdge(edge.altEdges.get(0)); } } // recursively unpack and prune edge, unless already visited private void unpack(Edge edge, Set unpacked) { if (unpacked.contains(edge)) return; // add to unpacked set unpacked.add(edge); // OR: recursively unpack alts, merging resulting alts EdgeHash merged = new EdgeHash(); if (edge.altEdges == null) { throw new RuntimeException("No alts for: " + edge); } for (Edge alt : edge.altEdges) { // AND: unpack inputs, make alts, add to merged unpackAlt(alt, unpacked, merged); } // sort, rescore and prune List mergedList = new ArrayList(merged.asEdgeSet()); Collections.sort(mergedList, edgeComparator); List prunedEdges = pruningStrategy.pruneEdges(mergedList); numPrunedNeverAdded += prunedEdges.size(); // replace edge's alts, add to unpruned edges edge.altEdges.clear(); edge.altEdges.addAll(mergedList); allEdges.addAll(mergedList); // update signMap (for debugging) for (Edge mergedEdge : mergedList) { if (!signMap.containsKey(mergedEdge.sign)) signMap.put(mergedEdge.sign, mergedEdge); } } // recursively unpack inputs, make alt combos and add to merged private void unpackAlt(Edge alt, Set unpacked, EdgeHash merged) { // first check for opt completed edge if (alt.optCompletes != null) { // recursively unpack input edge Edge inputEdge = alt.optCompletes; unpack(inputEdge, unpacked); // then make and merge alt edges from input alt edges for (Edge inputAlt : inputEdge.altEdges) { Edge edgeToAdd = (inputAlt.sign == alt.sign) ? alt // use this alt for same sign : edgeFactory.makeAltEdge(inputAlt.sign, alt); // otherwise make edge for new alt merged.insert(edgeToAdd); } return; } // otherwise unpack via input signs DerivationHistory history = alt.sign.getDerivationHistory(); Sign[] inputSigns = history.getInputs(); // base case: no inputs if (inputSigns == null) { merged.insert(alt); return; } // otherwise recursively unpack Edge[] inputEdges = new Edge[inputSigns.length]; for (int i = 0; i < inputSigns.length; i++) { inputEdges[i] = signMap.get(inputSigns[i]); // get input edge using signMap unpack(inputEdges[i], unpacked); } // then make edges for new combos, and add to merged (if unseen) Category resultCat = alt.sign.getCategory(); boolean lefthead = (alt.sign.getLexHead() == inputSigns[0].getLexHead()); List altCombos = inputCombos(inputEdges, 0); for (Sign[] combo : altCombos) { Sign lexHead = (lefthead) ? combo[0].getLexHead() : combo[1].getLexHead(); Sign sign = Sign.createDerivedSignWithNewLF(resultCat, combo, history.getRule(), lexHead); Edge edgeToAdd = (sign.equals(alt.sign)) ? 
alt // use this alt for equiv sign : edgeFactory.makeAltEdge(sign, alt); // otherwise make edge for new alt merged.insert(edgeToAdd); } } // returns a list of sign arrays, with each array of length inputEdges.length - i, // representing all combinations of alt signs from i onwards private List inputCombos(Edge[] inputEdges, int index) { Edge edge = inputEdges[index]; // base case, inputEdges[last] if (index == inputEdges.length-1) { List altEdges = edge.altEdges; List retval = new ArrayList(altEdges.size()); for (Edge alt : altEdges) { retval.add(new Sign[] { alt.sign }); } return retval; } // otherwise recurse on index+1 List nextCombos = inputCombos(inputEdges, index+1); // and make new combos List altEdges = edge.altEdges; List retval = new ArrayList(altEdges.size() * nextCombos.size()); for (Edge alt : altEdges) { for (int i = 0; i < nextCombos.size(); i++) { Sign[] nextSigns = nextCombos.get(i); Sign[] newCombo = new Sign[nextSigns.length+1]; newCombo[0] = alt.sign; System.arraycopy(nextSigns, 0, newCombo, 1, nextSigns.length); retval.add(newCombo); } } return retval; } //----------------------------------------------------------------- // best edges (single best is available directly as bestEdge) // cached best edges private transient List bestEdges = null; /** * Returns the best complete edges, sorted by their score and * pruned by the pruning strategy. */ public List bestEdges() { if (bestEdges != null) return bestEdges; bestEdges = new ArrayList(); if (!bestEdge.complete()) return bestEdges; List edgesToUse = (usePacking && !doUnpacking) ? edges : allEdges; for (Edge edge : edgesToUse) { if (edge.complete()) bestEdges.add(edge); } Collections.sort(bestEdges, edgeComparator); pruningStrategy.pruneEdges(bestEdges); return bestEdges; } /** * Returns the oracle best edge for the given string, together * with a flag indicating whether the target string was found. * At present, returns the edge from bestEdges() whose * orthography equals the given string, otherwise the one * with the highest 4-gram precision score (breaking ties * using the list order). * TODO: It would be better to return the forest oracle. */ public Pair oracleBest(String target) { List edges = bestEdges(); // check orth for (Edge edge : edges) { if (edge.getSign().getOrthography().equals(target)) return new Pair(edge, true); } // check 4-gram precision Edge retval = null; double bestScore = 0; NgramPrecisionModel oracle = new NgramPrecisionModel(new String[]{target}); for (Edge edge : edges) { double score = oracle.score(edge.getSign(), true); if (score > bestScore) { retval = edge; bestScore = score; } } // done return new Pair(retval, false); } //----------------------------------------------------------------- // printing routines /** The PrintWriter to use with the printing routines. Default wraps System.out. */ public PrintWriter out = new PrintWriter(System.out); /** Prints the best edge found. */ public void printBestEdge() { printEdge(bestEdge); if (!edgeFactory.labeledNominals.isEmpty()) { try { ByteArrayOutputStream bstr = new ByteArrayOutputStream(); edgeFactory.grammar.serializeXml( bestEdge.sign.getWordsInXml(edgeFactory.labeledNominals), bstr ); out.println(bstr.toString()); } catch (java.io.IOException exc) { throw (RuntimeException) new RuntimeException().initCause(exc); } } out.println(bestEdge.sign.getBracketedString()); out.flush(); } /** Prints the best joined edge. 
*/ public void printBestJoinedEdge() { if (bestJoinedEdge == null) return; printEdge(bestJoinedEdge); out.println(bestJoinedEdge.sign.getBracketedString()); out.flush(); } /** Prints the timing (and related) info. */ public void printTiming() { out.println(); if (!usePacking) { if (bestEdge != null && bestEdge.complete()) out.println("time 'til first (ms): " + timeTilFirst); if (bestEdge != null) out.println("time 'til best (ms): " + timeTilBest); if (timeTilStopped != 0) out.println("time 'til stopped (ms): " + timeTilStopped); } else { out.println("time 'til packed (ms): " + timeTilPacked); } if (timeTilDone != 0) out.println("time 'til done (ms): " + timeTilDone); out.println(); out.println("rule apps: " + edgeFactory.ruleApps()); out.println("# edges: " + edges.size()); out.println("# unpruned edges: " + allEdges.size()); if (!usePacking) { out.println("# pruned: " + numPrunedRemoved + " removed, " + numPrunedNeverAdded + " never added"); } if (doUnpacking) { out.println("# pruned: " + numPrunedNeverAdded); } out.println("cell max: " + cellMax); out.flush(); } /** Prints all chart edges, unsorted. */ public void printEdges() { printEdges(false); } /** Prints chart edges unsorted, using the complete edges filter according to the given flag. */ public void printEdges(boolean complete) { printEdges(complete, false); } /** * Prints chart edges using the complete edges filter according to the given flag * and sorting according to the given flag. * In the packing only case, the representative edges are shown, otherwise * the unpruned (and possibly unpacked) edges are shown. */ public void printEdges(boolean complete, boolean sort) { List edgeList = (usePacking && !doUnpacking) ? edges : allEdges; if (sort) { edgeList = new ArrayList(edgeList); Collections.sort(edgeList, edgeComparator); } for (int i=0; i < edgeList.size(); i++) { Edge edge = edgeList.get(i); if (!complete || edge.complete()) { if (!sort) printEdge(edge, i, edgeList); else printEdge(edge); } } out.flush(); } /** * Prints the agenda. */ public void printAgenda() { for (Edge edge : agenda) { printEdge(edge); } out.flush(); } /** * Prints the initial edges. */ public void printInitialEdges() { for (Edge edge : edgeFactory.initialEdges) { printEdge(edge); } out.flush(); } // prints edge with incomplete LF chunks and active alts private void printEdge(Edge edge) { printEdge(edge, -1, null); } // prints also with edge index and derivation, if index non-negative private void printEdge(Edge edge, int index, List edgeList) { String str = ""; if (index >= 0) str += index + ". "; str += edge.toString(); if (edge.incompleteLfChunk != null) { int id = edgeFactory.lfChunks.indexOf(edge.incompleteLfChunk); str += " <[" + id + "]>"; } if (edge.activeLfAlts.size() > 0) str += " "; for (List altSet : edge.activeLfAlts) { for (Alt alt : altSet) str += "?" + alt.altSet + "." 
+ alt.numInSet; } str += edgeDerivation(edge, index, edgeList); out.println(str); // show alts subordinated in packing only case if (usePacking && !doUnpacking && edge.isDisjunctive()) { for (Edge alt : edge.altEdges) { if (alt != edge) out.println(" \\_ " + alt + edgeDerivation(alt, index, edgeList)); } } } // returns derivation, if index non-negative private String edgeDerivation(Edge edge, int index, List edgeList) { if (index < 0) return ""; if (edge.optCompletes != null) { return " (" + edgeList.indexOf(edge.optCompletes) + " optC)"; } DerivationHistory history = edge.sign.getDerivationHistory(); Sign[] inputs = history.getInputs(); if (inputs == null) return " (lex)"; String retval = " ("; for (Sign sign : inputs) { Edge repEdge = signMap.get(sign); if (repEdge != null) retval += edgeList.indexOf(repEdge) + " "; } retval += history.getRule().name() + ")"; return retval; } /** * Prints the licensed, marked initial edges. */ public void printMarkedEdges() { for (Edge edge : edgeFactory.markedEdges) { printEdge(edge); } out.flush(); } /** * Prints the licensed, instantiated purely syntactic (semantically null) edges. */ public void printInstantiatedNoSemEdges() { for (Edge edge : edgeFactory.instantiatedNoSemEdges) { printEdge(edge); } out.flush(); } /** * Prints the licensed, uninstantiated purely syntactic (semantically null) edges. */ public void printNoSemEdges() { for (Edge edge : edgeFactory.noSemEdges) { out.println(edge.toString()); } out.flush(); } /** * Prints the rule instances, with instantiated semantics. */ public void printRuleInstances() { for (Iterator it = edgeFactory.ruleInstances.iterator(); it.hasNext(); ) { out.println(it.next().toString()); } out.flush(); } /** * Prints the LF chunks. */ public void printLfChunks() { List chunks = edgeFactory.lfChunks; for (int i = 0; i < chunks.size(); i++) { BitSet chunk = chunks.get(i); out.println("chunk[" + i + "]: " + Edge.toString(chunk)); } out.flush(); } /** * Prints the LF alternatives. */ public void printLfAlts() { for (List altSet : edgeFactory.lfAlts) { for (Alt alt : altSet) { out.print("alt[" + alt.altSet + "." + alt.numInSet + "]: "); out.println(Edge.toString(alt.bitset)); } } out.flush(); } /** * Prints the LF optional parts. */ public void printLfOpts() { List opts = edgeFactory.lfOpts; for (int i = 0; i < opts.size(); i++) { BitSet opt = opts.get(i); out.println("opt[" + i + "]: " + Edge.toString(opt)); } out.flush(); } /** * Prints the elementary predications. 
*/ public void printEPs() { List preds = edgeFactory.preds; for (int i=0; i < preds.size(); i++) { SatOp lf_i = preds.get(i); out.println("ep[" + i + "]: " + lf_i); } out.flush(); } //----------------------------------------------------------------- // chart management // in the anytime case, first checks signs to see whether an edge // whose sign is equivalent (up to surface words) and which has // an equal or higher score or equal // or lower derivational complexity has been seen already, and drops // the given edge if so (in the packing case, this equivalence check is // performed during unpacking); // if the edge replaces an (essentially) equivalent edge of lower score or higher // derivational complexity, removes the old edge from the agenda // or removes it from its equivalence class and puts it on a list of // superceded edges to be pruned from the chart; // then, in all cases, adds the given edge to the agenda, // and updates the best edge so far, with preference given to completeness, // then sign score private void addEdgeToAgenda(Edge edge) { numEdges++; if (!usePacking) { // update edgeHash, checking for equivalent edge of equal or lower complexity Edge retEdge = edgeHash.insert(edge); boolean actuallyInserted = (retEdge != null); if (!actuallyInserted) { return; } // just drop it // remove old edge, if apropos Edge oldEdge = (retEdge != edge) ? retEdge : null; if (oldEdge != null) { // check agenda first boolean onAgenda = agenda.remove(oldEdge); // if not on agenda, remove from equiv class, if present, // and add to list of superceded edges pending removal // nb: delaying pruning of superceded edges from chart // is nec. to avoid a problem with concurrent access // to allEdges in doEdgeCombos if (!onAgenda) { Edge repEdge = catMap.get(oldEdge); if (repEdge != null) { boolean inChart = repEdge.altEdges.remove(oldEdge); if (inChart) supercededEdgesPendingRemoval.add(oldEdge); } } } } if (depthFirst) { agenda.add(0, edge); } else if (edge.score == 0) { agenda.add(edge); } else { addSorted(agenda, edge); } updateBestEdge(edge); } // update bestEdge wrt given edge, and adjust timing info private void updateBestEdge(Edge edge) { if (bestEdge == null) { bestEdge = edge; long endTime = System.currentTimeMillis(); timeTilBest = (int) (endTime - startTime); if (bestEdge.complete()) timeTilFirst = timeTilBest; return; } if (bestEdge.completeness > edge.completeness) return; if (bestEdge.completeness < edge.completeness) { bestEdge = edge; long endTime = System.currentTimeMillis(); timeTilBest = (int) (endTime - startTime); if (bestEdge.complete()) timeTilFirst = timeTilBest; return; } if (edge.score > bestEdge.score) { bestEdge = edge; long endTime = System.currentTimeMillis(); timeTilBest = (int) (endTime - startTime); if (bestEdge.complete()) newBest++; } } // removes superceded edges from the chart private void pruneSupercededEdges() { for (Edge oldEdge : supercededEdgesPendingRemoval) { allEdges.remove(oldEdge); numPrunedRemoved++; } supercededEdgesPendingRemoval.clear(); } // adds the edge to the chart and makes it a representative edge if it's the // first one added for its equiv class; otherwise it's added as an alternative; // in the anytime case, prunes the edges listed as alts for the representative edge, // and adds the edge to the list of all unpruned edges, if it survives pruning; // returns true if the edge is actually added, and false if it doesn't survive // the pruning (anytime case), or is folded into an existing edge (packing case); // prunes the edge and returns 
false if the cell count is exceeded private boolean addEdgeToChart(Edge edge) { // check cell count if (cellPruningValue != NO_PRUNING && cellCount(edge) >= cellPruningValue) { numPrunedNeverAdded++; return false; } // inc cell count incCellCount(edge); // get representative edge for this edge Edge repEdge = catMap.get(edge); // check for same edge already in chart; pretend it's been added if (edge == repEdge) return true; // if none, make this edge into one, adding it to the chart if (repEdge == null) { edge.initAltEdges(); // nb: could try capacity of pruningValue+1 if (collectCombos) edge.initEdgeCombos(); catMap.put(edge, edge); edges.add(edge); signMap.put(edge.sign, edge); // anytime case: add to all edges list too if (!usePacking) allEdges.add(edge); // and return return true; } // otherwise add edge to alts (sorted) else { addSorted(repEdge.altEdges, edge); // packing case: return false, as edge is simply folded into repEdge if (usePacking) return false; } // anytime case: if not pruning, just add edge to all edges list, and return if (pruningValue == NO_PRUNING) { allEdges.add(edge); signMap.put(edge.sign, edge); // for debugging return true; } // otherwise do pruning List prunedEdges = pruningStrategy.pruneEdges(repEdge.altEdges); boolean edgeItselfPruned = false; for (Edge prunedEdge : prunedEdges) { if (prunedEdge != edge) { allEdges.remove(prunedEdge); numPrunedRemoved++; } else edgeItselfPruned = true; } // add edge to all edges list, if it was not pruned if (!edgeItselfPruned) { allEdges.add(edge); signMap.put(edge.sign, edge); // for debugging return true; } // otherwise false numPrunedNeverAdded++; return false; } // cell count private int cellCount(Edge edge) { Integer count = cellMap.get(edge.bitset); return (count == null) ? 0 : count; } // inc cell count private void incCellCount(Edge edge) { int count = cellCount(edge); cellMap.put(edge.bitset, ++count); if (count > cellMax) cellMax = count; } //----------------------------------------------------------------- // edge sorted insertion and comparison // adds the given edge into the already sorted list, // maintaining the sort order; // when gluing fragments, edges are sorted first by size, // otherwise by score private void addSorted(List list, Edge edge) { Comparator comparator = (gluingFragments) ? edgeSizeComparator : edgeComparator; // do binary search int index = Collections.binarySearch(list, edge, comparator); // check if search found an edge with the same sort pos if (index >= 0) { // if so, advance the index past sort equiv edges while (index < list.size()) { Edge existingEdge = list.get(index); //if (existingEdge.score == edge.score) index++; if (comparator.compare(existingEdge, edge) == 0) index++; else break; } } else { // otherwise, convert index to insertion point index = Math.abs(index) - 1; } // then add edge at index list.add(index, edge); } /** Compares edges based on their relative score, in descending order. */ public static final Comparator edgeComparator = new Comparator() { public int compare(Edge edge1, Edge edge2) { return -1 * Double.compare(edge1.score, edge2.score); } }; /** Compares edges based on their relative size then score, in descending order. 
*/ public static final Comparator edgeSizeComparator = new Comparator() { public int compare(Edge edge1, Edge edge2) { int retval = -1 * Float.compare(edge1.completeness, edge2.completeness); if (retval != 0) return retval; return -1 * Double.compare(edge1.score, edge2.score); } }; } ================================================ FILE: src/opennlp/ccg/realize/DiversityPruningStrategy.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004-5 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.realize; import opennlp.ccg.synsem.Sign; import java.util.*; import gnu.trove.*; /** * Abstract n-best edge pruning strategy that keeps edges diversified * according to the notCompellinglyDifferent equivalence relation. * The edges are clustered into a ranked list of equivalence classes, * which are sequentially sampled until the limit n is reached to determine * the edges to keep. * If the singleBestPerGroup flag is set, then a maximum of one edge * per equivalence class is retained. * * @author Michael White * @version $Revision: 1.4 $, $Date: 2009/12/21 03:27:18 $ */ abstract public class DiversityPruningStrategy extends NBestPruningStrategy { /** Flag for whether to keep only the single best edge among those that are not compellingly different (defaults to false). */ public boolean singleBestPerGroup = false; /** Reusable set of edges to keep. */ protected THashSet keepers = new THashSet(new TObjectIdentityHashingStrategy()); /** Returns true iff the given signs are not compellingly different. */ abstract public boolean notCompellinglyDifferent(Sign sign1, Sign sign2); /** * Returns a (possibly empty) list of edges pruned * from the given ones, which should have equivalent * categories and be sorted by score, from highest to lowest. * In particular, prunes and returns the edges that fall below the N-best * cutoff when the diversity strategy determined by notCompellinglyDifferent * is applied. * If the singleBestPerGroup flag is set, no more than one edge * per group of equivalent ones will be returned. 
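Only notCompellinglyDifferent needs to be supplied by a subclass; a minimal sketch, assuming the no-argument superclass constructor, with a purely illustrative equivalence criterion (surface strings matching up to case):

    public class CaseInsensitiveDiversityPruning extends DiversityPruningStrategy {
        public boolean notCompellinglyDifferent(Sign sign1, Sign sign2) {
            // treat realizations that differ only in capitalization as interchangeable
            return sign1.getOrthography().equalsIgnoreCase(sign2.getOrthography());
        }
    }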
*/ public List pruneEdges(List catEdges) { // clear reusable return list retval.clear(); // ensure pruning enabled if (CAT_PRUNE_VAL == Chart.NO_PRUNING) return retval; // ensure there are edges to prune if (!singleBestPerGroup && catEdges.size() <= CAT_PRUNE_VAL) return retval; // group edges into ranked equivalence classes, // by using a list of lists, preserving order List> groups = new ArrayList>(); for (Edge edge : catEdges) { boolean foundGroup = false; for (int i = 0; i < groups.size(); i++) { List members = groups.get(i); Edge first = members.get(0); if (notCompellinglyDifferent(first.sign, edge.sign)) { members.add(edge); foundGroup = true; break; } } if (!foundGroup) { List members = new ArrayList(); members.add(edge); groups.add(members); } } // add top n to keepers by sequentially visiting groups, // according also to singleBestPerGroup flag keepers.clear(); int counter = 0; int numGroups = groups.size(); while (keepers.size() < CAT_PRUNE_VAL && (!singleBestPerGroup || counter < numGroups)) { int groupNum = counter % numGroups; int indexInGroup = counter / numGroups; List members = groups.get(groupNum); if (indexInGroup < members.size()) { keepers.add(members.get(indexInGroup)); } counter++; } // prune edges not in keepers for (Iterator it = catEdges.iterator(); it.hasNext(); ) { Edge edge = it.next(); if (!keepers.contains(edge)) { retval.add(edge); it.remove(); } } // done return retval; } } ================================================ FILE: src/opennlp/ccg/realize/Edge.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-5 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.realize; import opennlp.ccg.synsem.*; import opennlp.ccg.hylo.*; import opennlp.ccg.*; import java.util.*; import java.util.prefs.*; import java.text.*; /** *

    * An edge is a tracker for a sign, ie a sign together * with bitsets representing its coverage of the * input predicates and the semantic indices used, * along with lists of the active LF alts. * It also has a completeness percentage and a score, * as well as its most specific incomplete LF chunk (if any). * Edges are created by an EdgeFactory and managed by a Chart.
    * A representative edge is an edge that represents (stands in for) * other edges with the same category during the chart generation * process. A representative edge has a list of alternative edges, * which are assumed to share the same category; it is considered * disjunctive when there is more than one alternative. * Note that initially a representative edge will be in its list * of alternatives, but it can be removed during pruning. * Finally, for the anytime search, a representative edge can * maintain a collection of successful combinations, to avoid * invoking the combinatory rules multiple times with the same * combinations of categories.
    * * @author Michael White * @version $Revision: 1.32 $, $Date: 2010/08/10 04:10:15 $ */ public class Edge extends Tracker { /** Preference key for showing completeness. */ public static final String SHOW_COMPLETENESS = "Show Completeness"; /** Preference key for showing coverage bitset. */ public static final String SHOW_BITSET = "Show Bitset"; /** The sign. */ protected Sign sign; /** The completeness percentage. */ public final float completeness; /** The edge score. */ public final double score; /** The most specific incomplete LF chunk (if any). */ public final BitSet incompleteLfChunk; /** The alternative edges (none initially). */ protected List altEdges = null; /** The edge combos (none initially). */ protected EdgeCombos edgeCombos = null; /** The edge, if any, that this edge is constructed from by marking optional bits as completed. */ protected Edge optCompletes = null; /** Constructor. */ public Edge(Sign sign, BitSet bitset, BitSet indices, float completeness, double score, List> activeLfAlts, BitSet incompleteLfChunk) { super(bitset, indices, activeLfAlts); this.sign = sign; this.completeness = completeness; this.score = score; this.incompleteLfChunk = incompleteLfChunk; } /** Returns the sign. */ public Sign getSign() { return sign; } /** Returns whether this edge has completeness 1.0, ie, covers all the input preds. */ public boolean complete() { return (completeness == 1.0); } /** * Returns the nominal which is the value of the index feature on the * sign's target cat, or null if none. */ public Nominal getIndexNominal() { return sign.getCategory().getIndexNominal(); } /** * Returns true iff this edge can combine with the given tracker * without violating its LF chunk constraint (if any). * Specifically, returns true when this edge has no incomplete chunk * or the tracker is semantically empty; otherwise, returns true * iff the incomplete chunk intersects with the tracker's * coverage vector. */ public boolean meetsLfChunkConstraints(Tracker tracker) { if (incompleteLfChunk == null || tracker.bitset.isEmpty()) return true; return incompleteLfChunk.intersects(tracker.bitset); } /** Returns whether this edge is a representative. */ public boolean isRepresentative() { return altEdges != null; } /** Returns whether this edge is disjunctive. */ public boolean isDisjunctive() { return altEdges != null && altEdges.size() > 1; } /** Returns the list of alt edges, or the empty list if none. */ public List getAltEdges() { if (altEdges == null) return Collections.emptyList(); else return altEdges; } /** Initializes the alt edges list with a default capacity, adding this edge. */ public void initAltEdges() { initAltEdges(3); } /** Initializes the alt edges list with the given capacity, adding this edge. */ public void initAltEdges(int capacity) { // check uninitialized if (altEdges != null) throw new RuntimeException("Alt edges already initialized!"); altEdges = new ArrayList(capacity); altEdges.add(this); } /** Initializes the edge combos. */ public void initEdgeCombos() { // check representative status if (!isRepresentative()) throw new RuntimeException("Not a representative!"); if (edgeCombos != null) throw new RuntimeException("Edge combos already initialized!"); edgeCombos = new EdgeCombos(); } /** Returns a hash code for this edge. (Alternatives are not considered.) 
*/ public int hashCode() { int retval = sign.hashCode() + 31 * bitset.hashCode() + indices.hashCode(); retval += (int) (31000 * score); return retval; } /** * Returns a hash code for this edge based on the surface words, * ignoring the LF and ignoring the score. */ public int surfaceWordHashCode() { return sign.surfaceWordHashCode(true) + 31 * bitset.hashCode() + indices.hashCode(); } /** Returns whether this edge equals the given object. (Alternatives are not considered.) */ public boolean equals(Object obj) { if (obj == this) return true; if (!(obj instanceof Edge)) return false; Edge edge = (Edge) obj; return bitset.equals(edge.bitset) && indices.equals(edge.indices) && completeness == edge.completeness && score == edge.score && sign.equals(edge.sign); } /** * Returns whether this edge equals the given object based on the surface words, * ignoring the LF and ignoring the score. */ public boolean surfaceWordEquals(Object obj) { if (obj == this) return true; if (!(obj instanceof Edge)) return false; Edge edge = (Edge) obj; return bitset.equals(edge.bitset) && indices.equals(edge.indices) && sign.surfaceWordEquals(edge.sign, true); } /** * Returns a string for the edge in the format * {completeness} [score] orthography :- category {bitset}. */ public String toString() { Preferences prefs = Preferences.userNodeForPackage(TextCCG.class); boolean showCompleteness = prefs.getBoolean(SHOW_COMPLETENESS, false); boolean showBitset = prefs.getBoolean(SHOW_BITSET, false); StringBuffer sbuf = new StringBuffer(); //sbuf.append(indices + " "); if (showCompleteness) { sbuf.append("{" + nf2.format(completeness) + "} "); } if (score >= 0.001 || score == 0.0) { sbuf.append("[" + nf3.format(score) + "] "); } else { sbuf.append("[" + nfE.format(score) + "] "); } sbuf.append(sign.toString()); if (showBitset) { sbuf.append(' ').append(toString(bitset)); } return sbuf.toString(); } // formats to two decimal places private static final NumberFormat nf2 = initNF2(); private static NumberFormat initNF2() { NumberFormat f = NumberFormat.getInstance(); f.setMinimumIntegerDigits(1); f.setMinimumFractionDigits(2); f.setMaximumFractionDigits(2); return f; } // formats to three decimal places private static final NumberFormat nf3 = initNF3(); private static NumberFormat initNF3() { NumberFormat f = NumberFormat.getInstance(); f.setMinimumIntegerDigits(1); f.setMinimumFractionDigits(3); f.setMaximumFractionDigits(3); return f; } // formats to "0.##E0" private static final NumberFormat nfE = new DecimalFormat("0.##E0"); /** Formats bitset compactly, with ranges hyphenated. */ public static String toString(BitSet bitset) { StringBuffer sbuf = new StringBuffer(); sbuf.append('{'); int j = 0; for (int i = bitset.nextSetBit(0); i >= 0; i = bitset.nextSetBit(j+1)) { if (j != 0) sbuf.append(','); j = bitset.nextClearBit(i); if (j == i+1) sbuf.append(Integer.toString(i)); else sbuf.append(i + "-" + (j-1)); } sbuf.append('}'); return sbuf.toString(); } } ================================================ FILE: src/opennlp/ccg/realize/EdgeCombos.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. 
// // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.realize; import java.util.*; /** * EdgeCombos is a simple data structure that allows a representative edge * to collect the info about successful combinations of the edge (with * other edges or unary rules) that is needed to create analogous new result edges * for edges that share the same category, without having to invoke * the combinatory rules. * * @author Michael White * @version $Revision: 1.3 $, $Date: 2005/10/13 18:20:30 $ */ public class EdgeCombos { /** Info for a collected category combination. */ public class CatCombo { /** The (other) input edge for the category combo. */ public final Edge inputEdge; /** The result edge, to use in making alternative edges. */ public final Edge resultEdge; /** Constructor */ public CatCombo(Edge inputEdge, Edge resultEdge) { this.inputEdge = inputEdge; this.resultEdge = resultEdge; } } /** The rightward combos. */ public final List rightwardCombos = new ArrayList(5); /** The leftward combos. */ public final List leftwardCombos = new ArrayList(5); /** The unary results. */ public final List unaryResults = new ArrayList(3); /** The optional results, ie with optional parts marked as completed. */ public final List optionalResults = new ArrayList(3); /** Adds a rightward combo. */ public void addRightwardCombo(Edge inputEdge, Edge resultEdge) { rightwardCombos.add(new CatCombo(inputEdge, resultEdge)); } /** Adds a leftward combo. */ public void addLeftwardCombo(Edge inputEdge, Edge resultEdge) { leftwardCombos.add(new CatCombo(inputEdge, resultEdge)); } } ================================================ FILE: src/opennlp/ccg/realize/EdgeFactory.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-11 University of Edinburgh / Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.realize; import opennlp.ccg.*; import opennlp.ccg.lexicon.*; import opennlp.ccg.grammar.*; import opennlp.ccg.unify.*; import opennlp.ccg.synsem.*; import opennlp.ccg.hylo.*; import opennlp.ccg.util.*; import gnu.trove.*; import java.util.*; import java.util.prefs.*; /** * The EdgeFactory is responsible for creating edges. 
* A single edge factory instance per realization request is assumed. * * @author Michael White * @version $Revision: 1.87 $, $Date: 2011/10/30 21:06:47 $ */ public class EdgeFactory { /** Preference key for whether to use indexing to filter edges to combine. */ public static final String USE_INDEXING = "Use Indexing"; /** Preference key for whether to (exceptionally) allow categories with no target cat index nominal to combine. */ public static final String ALLOW_MISSING_INDEX_COMBOS = "Allow Missing Index Combos"; /** Preference key for whether to use LF chunks to filter edges to combine. */ public static final String USE_CHUNKS = "Use Chunks"; /** Preference key for whether to use feature licensing; if false, the simple lex feature is used for comparison purposes. */ public static final String USE_FEATURE_LICENSING = "Use Feature Licensing"; /** The grammar used to create edges. */ public final Grammar grammar; /** The elementary predications to be covered. */ public final List preds; /** The sign scorer. */ public final SignScorer signScorer; /** The hypertagger. */ public final Hypertagger hypertagger; /** The initial, unmarked edges instantiated after lexical lookup. */ public final List initialEdges = new ArrayList(); /** The marked initial edges licensed by features in the other initial edges. */ public final List markedEdges = new ArrayList(); /** The licensed and instantiated purely syntactic (semantically null) edges. */ public final List instantiatedNoSemEdges = new ArrayList(); /** The licensed, uninstantiated purely syntactic edges. */ public final List noSemEdges = new ArrayList(); /** The rule instances, ie the type changing rules with instantiated semantics. */ public final List ruleInstances = new ArrayList(); /** The LF chunks, represented as bitsets. */ public final List lfChunks = new ArrayList(); /** The LF alts, represented as a list of lists of alts (where each list of alts forms an exclusive disjunction). */ public final List> lfAlts = new ArrayList>(); /** The LF optional parts, represented as bitsets. */ public final List lfOpts = new ArrayList(); /** Flag indicating whether there are any LF alts or optional parts. */ public boolean hasLfAltsOrOpts = false; // a bitset for all preds private final BitSet allPreds; // the lexicon used to create edges private final Lexicon lexicon; // general rules, ie the ones with no associated semantics private final RuleGroup generalRules; // rule group for rules wrapped by rule instances private final RuleGroup ruleInstancesGroup; // rule for joining fragments private final FragmentJoining fragmentRule = new FragmentJoining(); // helper class for licensing features private final FeatureLicenser featureLicenser; /** Set of nominals whose phrases are marked for labeling in the output (with mark=+). */ public final Set labeledNominals = new HashSet(); /** Map from nominals to ints, for indexing edges. */ final TObjectIntHashMap nominals = new TObjectIntHashMap(); // indexes the preds by their position, // by mapping pred keys to a list of pred indices for that key private final Map> predMap = new HashMap>(); // list of paired nominals in the input LF private final List pairedNominals = new ArrayList(); // flag for whether there are any paired nominals private boolean anyPairedNominals = false; /** Set of nominals under a BoundVar relation. */ final Set boundVarNominals = new HashSet(); // list of nominals for a particular cat or pair of cats private final List catNominals = new ArrayList(); /** * Flag for whether to use indexing. 
* Setting retrieved from preferences; turned off when gluing fragments. */ public boolean useIndexing = true; // flag for whether to (exceptionally) allow categories with no target cat index nominal to combine private boolean allowMissingIndexCombos = false; // flag for whether to use chunks private boolean useChunks = true; // flag for whether to use feature licensing private boolean useFeatureLicensing = true; /** * Flag for whether to debug category instantiation (defaults to false). * If true, cases of complex categories whose outermost category * is not instantiated with index nominals are reported to * System.err. Note that realization is more efficient if such * categories can be avoided in the grammar. * Uncovered EPs after lex lookup are also reported to System.err. */ public boolean debugInstantiation = false; /* The number of unary rule applications executed. */ private int unaryRuleApps = 0; /* The number of unary rule instance applications executed. */ private int unaryRuleInstApps = 0; /* The number of binary rule applications executed. */ private int binaryRuleApps = 0; /** Flag for whether to glue fragments currently. Defaults to false. */ public boolean gluingFragments = false; /** Bit vector for EPs not covered by a lexical edge or rule instance; null if none. */ protected BitSet uncoveredEPs = null; /** Flag indicating whether any lexical or featural EPs are uncovered. */ public boolean hasUncoveredPreds = false; /** Flag for whether to use relaxed relation matching. */ // XXX tmp switch protected boolean useRelaxedRelationMatching = Boolean.getBoolean("useRelaxedRelationMatching"); /** Constructor. */ public EdgeFactory(Grammar grammar, List preds, SignScorer signScorer) { this(grammar, preds, signScorer, null); } /** Constructor with hypertagger. */ public EdgeFactory(Grammar grammar, List preds, SignScorer signScorer, Hypertagger hypertagger) { this.grammar = grammar; this.preds = preds; this.signScorer = signScorer; this.hypertagger = hypertagger; lexicon = grammar.lexicon; generalRules = new RuleGroup(grammar); generalRules.borrowSupercatRuleCombos(grammar.rules); ruleInstancesGroup = new RuleGroup(grammar); ruleInstancesGroup.borrowSupercatRuleCombos(grammar.rules); allPreds = new BitSet(preds.size()); allPreds.set(0, preds.size()); Preferences prefs = Preferences.userNodeForPackage(TextCCG.class); useIndexing = prefs.getBoolean(USE_INDEXING, true); allowMissingIndexCombos = prefs.getBoolean(ALLOW_MISSING_INDEX_COMBOS,false); useChunks = prefs.getBoolean(USE_CHUNKS, true); useFeatureLicensing = prefs.getBoolean(USE_FEATURE_LICENSING, true); if (useFeatureLicensing) { featureLicenser = new FeatureLicenser(this); } else { // if feature licensing off, use simple lex feature for comparison purposes featureLicenser = new FeatureLicenser( this, new LicensingFeature[] { LicensingFeature.simpleLexFeature } ); } UnifyControl.startUnifySequence(); extractLabeledNominals(); indexPreds(); listNominals(); listPairedNominals(); addBoundVarNominals(); fillLfChunks(); fillLfAlts(); fillLfOpts(); hasLfAltsOrOpts = lfAlts.size() > 0 || lfOpts.size() > 0; if (hypertagger != null) hypertagger.mapPreds(preds); } /** * Adds LF optional parts for any preds not covered by a lex item or rule instance, * divided up by chunks, for use with fragment gluing or relaxed relation matching. 
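 * For example (the EP numbers are hypothetical): with uncovered EPs {2,3,5}
 * and LF chunks {2,3} and {4,5}, the optional parts {2,3} (the intersection
 * with the first chunk) and {5} (the remainder) would be added, so that
 * realization can still complete without covering those EPs.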
*/ public void addLFOptsForUncoveredPreds() { // see if all preds covered if (uncoveredEPs == null) return; // clone what's not covered by lex items and rule instances BitSet opt = (BitSet) uncoveredEPs.clone(); // otherwise add opts for what's missing // nb: need to split up by chunks for (BitSet chunk : lfChunks) { if (opt.intersects(chunk)) { BitSet optChunk = (BitSet) opt.clone(); optChunk.and(chunk); if (!lfOpts.contains(optChunk)) lfOpts.add(optChunk); opt.andNot(optChunk); } } // add anything remaining if (!opt.isEmpty() && !lfOpts.contains(opt)) lfOpts.add(opt); // ensure hasLfAltsOrOpts set hasLfAltsOrOpts = true; // TODO deal with lf alts too (may require sorting chunks and alts by size) } /** * Adds an LF optional part for each instantiated rule instance, * for use with fragment gluing. */ public void addLFOptsForRuleInstances() { // do each rule instance for (RuleInstance ruleInstance : ruleInstances) { BitSet opt = (BitSet) ruleInstance.bitset.clone(); lfOpts.add(opt); } // ensure hasLfAltsOrOpts set if (lfOpts.size() > 0) hasLfAltsOrOpts = true; } // returns the uncovered preds, or null if none private BitSet uncoveredPreds() { // determine what's covered by lex items and rule instances BitSet retval = new BitSet(preds.size()); for (Edge edge : initialEdges) retval.or(edge.bitset); for (Edge edge : markedEdges) retval.or(edge.bitset); for (RuleInstance ruleInstance : ruleInstances) retval.or(ruleInstance.bitset); // see if all preds covered if (retval.equals(allPreds)) return null; // otherwise xor what's missing retval.xor(allPreds); // set missing lex preds flag for (int i = retval.nextSetBit(0); i >= 0; i = retval.nextSetBit(i+1)) { SatOp pred = preds.get(i); if (HyloHelper.isLexPred(pred) || HyloHelper.isAttrPred(pred)) { hasUncoveredPreds = true; break; } } // return return retval; } //----------------------------------------------------------------- // edge construction // /** Makes an edge, computing the completeness percentage, sign score, and indices, and setting the most specific incomplete LF chunk (if any). */ protected Edge makeEdge(Sign sign, BitSet bitset, List> activeLfAlts) { BitSet indices = getIndices(sign.getCategory(), null); float completeness = bitset.cardinality() / (float) preds.size(); boolean complete = (completeness == 1.0); double score = signScorer.score(sign, complete); BitSet incompleteLfChunk = getIncompleteLfChunk(bitset, activeLfAlts); return new Edge(sign, bitset, indices, completeness, score, activeLfAlts, incompleteLfChunk); } /** Makes an edge for the given alt sign from the given edge, after computing the sign's score. */ protected Edge makeAltEdge(Sign altSign, Edge edge) { double score = signScorer.score(altSign, edge.complete()); return new Edge( altSign, edge.bitset, edge.indices, edge.completeness, score, edge.activeLfAlts, edge.incompleteLfChunk ); } /** Makes an edge consisting of two joined fragments. 
*/ public Edge makeJoinedEdge(Edge edge1, Edge edge2) { Sign sign = fragmentRule.applyRule(edge1.sign, edge2.sign); BitSet bitset = (BitSet) edge1.bitset.clone(); bitset.or(edge2.bitset); float completeness = bitset.cardinality() / (float) preds.size(); boolean complete = (completeness == 1.0); double score = signScorer.score(sign, complete); return new Edge( sign, bitset, edge1.indices, completeness, score, edge1.activeLfAlts, edge1.incompleteLfChunk ); } //----------------------------------------------------------------- // active alts // /** From the given LF alts, returns the active ones for the given bitset, updating the bitset for any completely covered alts. NB: If the given LF alts list is not the entire list, each alt is assumed to intersect. */ private List> getActiveLfAlts(List> fromLfAlts, BitSet bitset) { if (fromLfAlts.isEmpty()) return fromLfAlts; boolean checkingAllAlts = (fromLfAlts == lfAlts); BitSet tmpBitSet = new BitSet(bitset.size()); List> retval = new ArrayList>(fromLfAlts.size()); // check each 'from' alt for (List altSet : fromLfAlts) { List activeAltSet = null; // for collecting active alts boolean foundCoveredAlt = false; for (Alt alt : altSet) { // if checking all alts, check intersection with alt if (!checkingAllAlts || alt.bitset.intersects(bitset)) { // check whether alt completely covered tmpBitSet.clear(); tmpBitSet.or(bitset); tmpBitSet.and(alt.bitset); if (tmpBitSet.equals(alt.bitset)) { foundCoveredAlt = true; break; } else { // otherwise add to active alts if (activeAltSet == null) activeAltSet = new ArrayList(3); activeAltSet.add(alt); } } } if (foundCoveredAlt) { // update coverage bitset to include all alts in this set List fullAltSet = lfAlts.get(altSet.get(0).altSet); for (Alt alt : fullAltSet) bitset.or(alt.bitset); } else { // otherwise update active alts, if any if (activeAltSet != null) retval.add(activeAltSet); } } return retval; } /** Returns the active LF alts that result from combining the given ones, or null if these are incompatible. For alt sets in common, the combined alts consist of the intersection of these alt sets, or null if this intersection is empty. For alts sets not in common, the active alts are carried through unchanged. 
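 * By way of illustration (the alt names are hypothetical): if one edge's
 * active alts for alt set 0 are {a1, a2} and the other's are {a2, a3}, the
 * combined alts for that set are {a2}; if they were instead {a1} and {a3},
 * the empty intersection means the edges are incompatible and null is
 * returned.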
*/ private List> getCombinedLfAlts(List> activeLfAlts1, List> activeLfAlts2) { if (activeLfAlts1.isEmpty()) return activeLfAlts2; if (activeLfAlts2.isEmpty()) return activeLfAlts1; List> retval = new ArrayList>(activeLfAlts1.size() + activeLfAlts2.size()); Iterator> it1 = activeLfAlts1.iterator(); Iterator> it2 = activeLfAlts2.iterator(); List altSet1 = it1.next(); List altSet2 = it2.next(); for (int i = 0; i < lfAlts.size(); i++) { // inc to alt set i, if not yet there (or beyond) if (altSet1.get(0).altSet < i && it1.hasNext()) altSet1 = it1.next(); if (altSet2.get(0).altSet < i && it2.hasNext()) altSet2 = it2.next(); // check whether only one or the other has alt set i if (altSet1.get(0).altSet == i && altSet2.get(0).altSet != i) retval.add(altSet1); else if (altSet2.get(0).altSet == i && altSet1.get(0).altSet != i) retval.add(altSet2); else if (altSet1.get(0).altSet == i && altSet2.get(0).altSet == i) { // take intersection List combined = new ArrayList(Math.min(altSet1.size(),altSet2.size())); for (Alt alt : altSet1) { if (altSet2.contains(alt)) combined.add(alt); } // check for empty intersection, returning null if (combined.isEmpty()) return null; // otherwise add combined list retval.add(combined); } } return retval; } //----------------------------------------------------------------- // misc bookkeeping // // extracts the nominal atoms marked for labeling in the output private void extractLabeledNominals() { for (Iterator it = preds.iterator(); it.hasNext(); ) { SatOp pred = it.next(); if (!HyloHelper.isAttrPred(pred)) continue; Nominal nom1 = HyloHelper.getPrincipalNominal(pred); if (!(nom1 instanceof NominalAtom)) continue; String rel = HyloHelper.getRel(pred); if (rel == null || !rel.equals("mark")) continue; labeledNominals.add(nom1); it.remove(); } } // lists the nominals in the preds private void listNominals() { for (SatOp pred : preds) { Nominal nom1 = HyloHelper.getPrincipalNominal(pred); Nominal nom2 = HyloHelper.getSecondaryNominal(pred); if (nom1 instanceof NominalAtom && !nominals.containsKey(nom1)) { nominals.put(nom1, nominals.size()); } if (nom2 instanceof NominalAtom && !nominals.containsKey(nom2)) { nominals.put(nom2, nominals.size()); } } } // create bitset for cat indices private BitSet getIndices(Category cat, Category cat2) { catNominals.clear(); cat.forall(gatherIndices); if (cat2 != null) { cat2.forall(gatherIndices); } BitSet retval = new BitSet(nominals.size()); for (Iterator it = catNominals.iterator(); it.hasNext(); ) { Object nom = it.next(); int index = nominals.get(nom); retval.set(index); } return retval; } // check for uninstantiated outer args; if found, // set the indices to allow all combos, and issue // a warning if the debugInstantiation flag is set private void checkInstantiation(List edges) { for (int i = 0; i < edges.size(); i++) { Edge edge = edges.get(i); if (noSemEdges.contains(edge)) continue; // exempt uninstantiated no sem edges if (outerArgUninstantiated(edge.sign.getCategory())) { edge.indices.set(0, nominals.size()); if (debugInstantiation) { System.err.println("Warning: outer arg uninstantiated: " + edge.sign); } } } } // returns whether the outermost arg is not instantiated private boolean outerArgUninstantiated(Category cat) { if (!(cat instanceof ComplexCat)) return false; Arg outer = ((ComplexCat)cat).getOuterArg(); catNominals.clear(); outer.forall(gatherIndices); return catNominals.isEmpty(); } // gathers values of index feature in atomic cats private CategoryFcn gatherIndices = new CategoryFcnAdapter() { public void 
forall(Category c) { if (!(c instanceof AtomCat)) return; FeatureStructure fs = c.getFeatureStructure(); if (fs == null) return; addCatNominal(fs.getValue("index")); addCatNominal(fs.getValue("mod-index")); } }; // adds a nominal atom to catNominals private void addCatNominal(Object indexVal) { if (indexVal instanceof NominalAtom) { if (!catNominals.contains(indexVal)) { catNominals.add(indexVal); } } } // lists the paired nominals in the input LF, as a bitset pair private void listPairedNominals() { for (int i=0; i < preds.size(); i++) { SatOp pred = preds.get(i); if (!"tup".equals(HyloHelper.getLexPred(pred))) continue; Nominal tupNom = HyloHelper.getPrincipalNominal(pred); Nominal nom1 = null; Nominal nom2 = null; for (int j = i+1; j < preds.size(); j++) { SatOp predJ = preds.get(j); if (!tupNom.equals(HyloHelper.getPrincipalNominal(predJ))) break; if ("Item1".equals(HyloHelper.getRel(predJ))) { nom1 = HyloHelper.getSecondaryNominal(predJ); } if ("Item2".equals(HyloHelper.getRel(predJ))) { nom2 = HyloHelper.getSecondaryNominal(predJ); } } if (nom1 == null || nom2 == null) { System.err.println("Warning, couldn't find paired nominals for tuple: " + tupNom); continue; } if (!(nom1 instanceof NominalAtom)) continue; if (!(nom2 instanceof NominalAtom)) continue; BitSet[] pair = new BitSet[2]; pair[0] = new BitSet(nominals.size()); pair[0].set(nominals.get(nom1)); pair[1] = new BitSet(nominals.size()); pair[1].set(nominals.get(nom2)); pairedNominals.add(pair); anyPairedNominals = true; } } // adds the bound var nominals private void addBoundVarNominals() { for (int i=0; i < preds.size(); i++) { SatOp pred = preds.get(i); String rel = HyloHelper.getRel(pred); if (rel == null || !rel.equals("BoundVar")) continue; Nominal nom2 = HyloHelper.getSecondaryNominal(pred); if (!(nom2 instanceof NominalAtom)) continue; boundVarNominals.add(nom2); // check if nom2 is a tuple for (int j = 0; j < preds.size(); j++) { SatOp predJ = preds.get(j); if (!nom2.equals(HyloHelper.getPrincipalNominal(predJ))) continue; if (!"tup".equals(HyloHelper.getLexPred(predJ))) continue; // if so, add paired items as bound vars too for (int k = j+1; k < preds.size(); k++) { SatOp predK = preds.get(k); if (!nom2.equals(HyloHelper.getPrincipalNominal(predK))) break; String relK = HyloHelper.getRel(predK); if ("Item1".equals(relK) || "Item2".equals(relK)) { Nominal nom2K = HyloHelper.getSecondaryNominal(predK); if (!(nom2K instanceof NominalAtom)) continue; boundVarNominals.add(nom2K); } } } } } /** * Returns whether the indices for the two edges are paired in the input LF. 
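 * For instance (the nominal names are hypothetical): if the input LF contains
 * a tuple nominal t with lexical predicate "tup" and relations Item1 to x and
 * Item2 to y, then an edge whose indices are exactly {x} is paired with an
 * edge whose indices are exactly {y}, allowing the two to combine even though
 * their index sets do not intersect.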
*/ public boolean pairedWith(Edge edgeA, Edge edgeB) { for (int i = 0; i < pairedNominals.size(); i++) { BitSet[] pair = pairedNominals.get(i); if (pair[0].equals(edgeA.indices) && pair[1].equals(edgeB.indices)) { return true; } } return false; } // indexes the preds by their position into predMap private void indexPreds() { for (int i=0; i < preds.size(); i++) { String[] keys = predKeys(preds.get(i)); for (int j=0; j < keys.length; j++) { List indices = predMap.get(keys[j]); if (indices == null) { indices = new ArrayList(1); predMap.put(keys[j], indices); } indices.add(i); } } } // returns 0-2 keys for the given pred (where nom vars are skipped): // a lex pred is indexed by atom(pred) // a rel pred is indexed by atom and atom2 // an attr pred is indexed by atom private static String[] predKeys(LF pred) { Nominal nom = HyloHelper.getPrincipalNominal(pred); String lexPred = HyloHelper.getLexPred(pred); String rel = HyloHelper.getRel(pred); Nominal nom2 = HyloHelper.getSecondaryNominal(pred); List keys = new ArrayList(2); if (nom instanceof NominalAtom && lexPred != null) keys.add(nom.toString() + "(" + lexPred + ")"); if (nom instanceof NominalAtom && rel != null) keys.add(nom.toString() + "<" + rel + ">"); if (nom2 instanceof NominalAtom && rel != null) keys.add("<" + rel + ">" + nom2.toString()); return (String[]) keys.toArray(new String[keys.size()]); } // fills in the LF chunks list with the chunks for each pred, // then sorts them by specificity, from most to least private void fillLfChunks() { // for each pred, fill in chunks for (int i=0; i < preds.size(); i++) { SatOp pred = preds.get(i); TIntArrayList chunks = pred.getChunks(); if (chunks == null) continue; // for each chunk that this pred is part of for (int j = 0; j < chunks.size(); j++) { int chunkId = chunks.get(j); // ensure chunk bitset exists while (lfChunks.size() < (chunkId + 1)) { lfChunks.add(new BitSet(preds.size())); } // update chunk bitset BitSet chunk = lfChunks.get(chunkId); chunk.set(i); } } // do insertion sort, to ensure subset ordering List tmpList = new ArrayList(lfChunks); lfChunks.clear(); allChunks: for (BitSet chunk : tmpList) { for (int i=0; i < lfChunks.size(); i++) { BitSet sortedChunk = lfChunks.get(i); if (subset(chunk, sortedChunk)) { lfChunks.add(i, chunk); continue allChunks; } } lfChunks.add(chunk); } } // gets the most specific incomplete chunk for an edge, or null private BitSet getIncompleteLfChunk(BitSet bitset, List> activeLfAlts) { // check each chunk allChunks: for (BitSet lfChunk : lfChunks) { // for intersection if (!lfChunk.intersects(bitset)) { continue; } // for incomplete coverage if (!subset(lfChunk, bitset) && subset(bitset, lfChunk)) { // and for part of all active alts for (List altSet : activeLfAlts) { for (Alt alt : altSet) { if (!subset(lfChunk, alt.bitset)) continue allChunks; } } // return chunk return lfChunk; } } // otherwise null return null; } // returns true iff bitset1 is a subset of bitset2 private BitSet tmpBitSet = new BitSet(); private boolean subset(BitSet bitset1, BitSet bitset2) { tmpBitSet.clear(); tmpBitSet.or(bitset1); tmpBitSet.andNot(bitset2); return tmpBitSet.isEmpty(); } // returns true iff combining the edges would complete a chunk private boolean completesChunk(Edge edgeA, Edge edgeB) { if (edgeA.incompleteLfChunk != null) { tmpBitSet.clear(); tmpBitSet.or(edgeA.incompleteLfChunk); tmpBitSet.andNot(edgeA.bitset); tmpBitSet.andNot(edgeB.bitset); if (tmpBitSet.isEmpty()) return true; } if (edgeB.incompleteLfChunk != null) { tmpBitSet.clear(); 
tmpBitSet.or(edgeB.incompleteLfChunk); tmpBitSet.andNot(edgeA.bitset); tmpBitSet.andNot(edgeB.bitset); if (tmpBitSet.isEmpty()) return true; } return false; } // fills in the LF alts list with the alts for each pred private void fillLfAlts() { // for each pred for (int i=0; i < preds.size(); i++) { SatOp pred = preds.get(i); List alts = pred.getAlts(); if (alts == null) continue; // for each alt that this pred is part of for (Alt alt : alts) { // ensure list for alt set exists while (lfAlts.size() < (alt.altSet + 1)) { lfAlts.add(null); } List altSet = lfAlts.get(alt.altSet); if (altSet == null) { altSet = new ArrayList(5); lfAlts.set(alt.altSet, altSet); } // ensure list item for alt num is alt while (altSet.size() < (alt.numInSet + 1)) { altSet.add(null); } altSet.set(alt.numInSet, alt); // update alt bitset alt.bitset.set(i); } } } // fills in the LF opts list with the opts for each pred private void fillLfOpts() { // for each pred for (int i=0; i < preds.size(); i++) { SatOp pred = preds.get(i); TIntArrayList opts = pred.getOpts(); if (opts == null) continue; // for each opt that this pred is part of for (int j = 0; j < opts.size(); j++) { int optId = opts.get(j); // ensure opt bitset exists while (lfOpts.size() < (optId + 1)) { lfOpts.add(new BitSet(preds.size())); } // update opt bitset BitSet opt = lfOpts.get(optId); opt.set(i); } } } // returns the list of coart rels for the pred with the given index // NB: assumes that preds are sorted by their principal nominals, with the lex pred first private List getCoartRels(int predIndex) { SatOp pred = preds.get(predIndex); Nominal nom = HyloHelper.getPrincipalNominal(pred); List retval = null; for (int i = predIndex+1; i < preds.size(); i++) { SatOp relPred = preds.get(i); if (!nom.equals(HyloHelper.getPrincipalNominal(relPred))) break; String rel = HyloHelper.getRel(relPred); if (rel != null && grammar.lexicon.isCoartRel(rel)) { if (retval == null) retval = new ArrayList(3); retval.add(rel); } } return retval; } //----------------------------------------------------------------- // createInitialEdges // /** * Creates and returns all initial edges. * In particular, initializes all lexical edges that cover some of the input semantics; * also initializes edges for semantically null lexical items, * and initializes instances of type changing rules which * introduce their own semantics. * If a hypertagger is in place, only the beta-best edges are returned for each EP. 
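 * A minimal usage sketch (the variable names are hypothetical; preds is
 * assumed to be the flattened EP list for the input LF):
 * <pre>{@code
 * EdgeFactory factory = new EdgeFactory(grammar, preds, signScorer);
 * List<Edge> initial = factory.createInitialEdges();
 * // the chart then repeatedly combines edges via factory.createNewEdges(...)
 * }</pre>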
*/ public List createInitialEdges() { // marked initial edges that need to be licensed List markedEdgesForLicensing = new ArrayList(); // for each pred, create edges for signs indexed // by lexical preds and by indexed rels; // and similarly for type changing rules for (int i=0; i < preds.size(); i++) { SatOp pred = preds.get(i); String key = HyloHelper.getLexPred(pred); String rel = HyloHelper.getRel(pred); // skip if no lex pred or indexed rel (not expected) if (key == null && rel == null) continue; // update hypertagger for beta-best lookup if (hypertagger != null) hypertagger.setPred(i); Collection signs = new ArrayList(); Collection typeChangingRules = new ArrayList(); // add signs and rules for lex pred if (key != null) { List coartRels = getCoartRels(i); Collection lexPredSigns = lexicon.getSignsFromPred(key, coartRels); if (lexPredSigns != null) { signs.addAll(lexPredSigns); } Collection lexPredRules = grammar.rules.getRulesForPred(key); if (lexPredRules != null) { typeChangingRules.addAll(lexPredRules); } } // add signs and rules for indexed rel if (rel != null) { Collection indexedRelSigns = lexicon.getSignsFromRel(rel); if (indexedRelSigns != null) { signs.addAll(indexedRelSigns); } Collection indexedRelRules = grammar.rules.getRulesForRel(rel); if (indexedRelRules != null) { typeChangingRules.addAll(indexedRelRules); } } // create initial and marked edges for each sign, updating feature map for (Sign sign : signs) { List initialEdgesForSign = createInitialEdges(sign, i); if (initialEdgesForSign != null) { for (Edge initialEdge : initialEdgesForSign) { Category cat = initialEdge.sign.getCategory(); if (featureLicenser.needsLicensing(cat)) markedEdgesForLicensing.add(initialEdge); else { initialEdges.add(initialEdge); featureLicenser.updateFeatureMap(cat); } } } } // create rules instances for each rule, updating feature map for (TypeChangingRule rule : typeChangingRules) { List ruleInstancesForRule = createRuleInstances(rule, i); if (ruleInstancesForRule != null) { for (RuleInstance ruleInst : ruleInstancesForRule) { ruleInstances.add(ruleInst); featureLicenser.updateFeatureMap(ruleInst.rule.getArg()); featureLicenser.updateFeatureMap(ruleInst.rule.getResult()); } } } } // add licensed, marked initial edges int prevSize; do { // while list size is changing prevSize = markedEdgesForLicensing.size(); for (Iterator it = markedEdgesForLicensing.iterator(); it.hasNext(); ) { // check each edge Edge edge = it.next(); Category cat = edge.sign.getCategory(); if (featureLicenser.isLicensed(cat)) { // and add to marked edges if licensed markedEdges.add(edge); it.remove(); // updating feature map featureLicenser.updateFeatureMap(cat); } } } while (markedEdgesForLicensing.size() != prevSize); // initialize general rules initGeneralRules(); // initialize edges for semantically null lexical items initNoSemEdges(); // collect all initial edges List retval = new ArrayList( initialEdges.size() + markedEdges.size() + instantiatedNoSemEdges.size() + noSemEdges.size() ); retval.addAll(initialEdges); retval.addAll(markedEdges); retval.addAll(instantiatedNoSemEdges); retval.addAll(noSemEdges); // check instantiation of outermost cats checkInstantiation(retval); // set uncovered EPs uncoveredEPs = uncoveredPreds(); // warn if EPs missing and debug instantiation flag set if (uncoveredEPs != null && debugInstantiation) { System.err.println("Warning, uncovered preds after lex instantiation: " + Edge.toString(uncoveredEPs)); } // set opts for missing relations, if apropos if (useRelaxedRelationMatching) 
addLFOptsForUncoveredPreds(); // return return retval; } // return null if LF doesn't unify with preds private List createInitialEdges(Sign sign, int predIndex) { // get parts of sign List words = sign.getWords(); Category cat = sign.getCategory(); // instantiate List> instantiations = instantiate(cat, null, predIndex); // check for failure if (instantiations == null) return null; // otherwise fill cats and make edges List retval = new ArrayList(instantiations.size()); for (Pair inst : instantiations) { Substitution subst = inst.a; BitSet bitset = inst.b; Category filledCat = null; try { filledCat = (Category) cat.fill(subst); } catch (UnifyFailure uf) { // shouldn't happen throw new RuntimeException("Unable to fill cat: " + uf); } // index subcategorized semantically null words featureLicenser.indexSemanticallyNullWords(filledCat); // update lex origins for new sign Sign newSign = new Sign(words, filledCat); newSign.setOrigin(); // and add new edge List> activeLfAlts = getActiveLfAlts(lfAlts, bitset); retval.add(makeEdge(newSign, bitset, activeLfAlts)); } // and return them return retval; } // return null if result LF doesn't unify with preds private List createRuleInstances(TypeChangingRule rule, int predIndex) { // get parts of rule Category result = rule.getResult(); Category arg = rule.getArg(); // instantiate List> instantiations = instantiate(result, arg, predIndex); // check for failure if (instantiations == null) return null; // otherwise fill cats and make rule instances List retval = new ArrayList(instantiations.size()); for (Pair inst : instantiations) { Substitution subst = inst.a; BitSet bitset = inst.b; Category filledResult = null; Category filledArg = null; try { filledResult = (Category) result.fill(subst); filledArg = (Category) arg.fill(subst); } catch (UnifyFailure uf) { // shouldn't happen throw new RuntimeException("Unable to fill cat: " + uf); } // index subcategorized semantically null words featureLicenser.indexSemanticallyNullWords(filledArg); featureLicenser.indexSemanticallyNullWords(filledResult); // and return new rule instance BitSet indices = getIndices(filledResult, filledArg); TypeChangingRule newRule = new TypeChangingRule(filledArg, filledResult, rule.name(), rule.getFirstEP()); ruleInstancesGroup.addRule(newRule); List> activeLfAlts = getActiveLfAlts(lfAlts, bitset); RuleInstance ruleInst = new RuleInstance(newRule, bitset, indices, activeLfAlts); retval.add(ruleInst); } // and return them return retval; } // return null if cat LF doesn't unify with preds private List> instantiate(Category cat, Category cat2, int predIndex) { // unify with indexed pred UnifyControl.reindex(cat, cat2); List lfPreds = HyloHelper.getPreds(cat.getLF()); Substitution subst = null; SatOp indexedPred = preds.get(predIndex); int lfPredIndex = -1; for (int i=0; i < lfPreds.size(); i++) { LF lfPred = lfPreds.get(i); subst = new SimpleSubstitution(); try { Unifier.unify(lfPred, indexedPred, subst); lfPredIndex = i; break; } catch (UnifyFailure uf) {} } // if failed, return empty list if (lfPredIndex == -1) return null; // set indexed pred in bitset BitSet bitset = new BitSet(preds.size()); bitset.set(predIndex); // unify with rest of lfPreds, extending subst/bitset List remainingPreds = new ArrayList(lfPreds.size()); remainingPreds.addAll(lfPreds); remainingPreds.remove(lfPredIndex); int prevSize = -1; List> retval = new ArrayList>(3); List> prev = new ArrayList>(3); retval.add(new Pair(subst, bitset)); // loop until empty or no changes, in order to propagate matches while 
(!remainingPreds.isEmpty() && remainingPreds.size() != prevSize) { prevSize = remainingPreds.size(); for (Iterator it = remainingPreds.iterator(); it.hasNext(); ) { SatOp lfPred = it.next(); try { // fill index lfPred = (SatOp) lfPred.fill(subst); } catch (UnifyFailure uf) { // shouldn't happen throw new RuntimeException("Unable to fill lfPred: " + uf); } // find matching pred String[] lfPredKeys = predKeys(lfPred); if (lfPredKeys.length == 0) { // nb: this means the lfPred is underconstrained; // will need to check it later! continue; } List matchingPredIndices = new ArrayList(3); for (int i = 0; i < lfPredKeys.length; i++) { List indices = predMap.get(lfPredKeys[i]); if (indices != null) matchingPredIndices.addAll(indices); } if (matchingPredIndices.isEmpty()) { if (useRelaxedRelationMatching && HyloHelper.isRelPred(lfPred)) continue; // skip else return null; // fail } // try extending each subst/bitset: // first swap retval, prev, and clear retval List> tmp = prev; prev = retval; retval = tmp; retval.clear(); for (Pair inst : prev) { Substitution s = inst.a; BitSet b = inst.b; if (matchingPredIndices.size() == 1) { // reuse current instantiation int matchingPredIndex = matchingPredIndices.get(0); b.set(matchingPredIndex); if (checkAlts(b)) { try { // unify SatOp matchingPred = preds.get(matchingPredIndex); Unifier.unify(lfPred, matchingPred, s); retval.add(inst); } catch (UnifyFailure uf) {} } } else { // otherwise make copies for (int matchingPredIndex : matchingPredIndices) { Substitution s2 = new SimpleSubstitution((SimpleSubstitution)s); BitSet b2 = (BitSet)b.clone(); b2.set(matchingPredIndex); if (checkAlts(b2)) { try { // unify SatOp matchingPred = preds.get(matchingPredIndex); Unifier.unify(lfPred, matchingPred, s2); Pair inst2 = new Pair(s2, b2); retval.add(inst2); } catch (UnifyFailure uf) {} } } } } if (retval.isEmpty()) { if (useRelaxedRelationMatching && HyloHelper.isRelPred(lfPred)) { retval.addAll(prev); continue; // skip } else return null; // fail } it.remove(); } } // check for no more than one (rel) pred left over if (remainingPreds.size() > 1) return null; // done return retval; } // returns true iff no alt exclusions are violated // nb: needs to check that if there any intersections // with multiple alts, then these are only in the shared part private boolean checkAlts(BitSet b) { for (List altSet : lfAlts) { int intersects = 0; for (Alt alt : altSet) { if (alt.bitset.intersects(b)) intersects++; } if (intersects > 1) { // check intersections for (int i = 0; i < altSet.size(); i++) { Alt alt = altSet.get(i); if (alt.bitset.intersects(b)) { for (int j = i+1; j < altSet.size(); j++) { Alt alt2 = altSet.get(j); if (alt2.bitset.intersects(b)) { BitSet altOnly = (BitSet) alt.bitset.clone(); altOnly.andNot(alt2.bitset); BitSet alt2Only = (BitSet) alt2.bitset.clone(); alt2Only.andNot(alt.bitset); if (altOnly.intersects(b) && alt2Only.intersects(b)) return false; } } } } } } return true; } //----------------------------------------------------------------- // createNewEdges // /** * Returns all edges that can be created by combining the given edges, * without collecting combos. */ public List createNewEdges(Edge edge, Edge next) { return createNewEdges(edge, next, false); } /** * Returns all edges that can be created by combining the given edges; * if the collectCombos flag is true, the edges are updated with collected combos, * and additional alt edges are made for the remaining alternative edges for * the given first edge. 
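 * By way of illustration (variable names hypothetical): a chart would
 * typically call {@code createNewEdges(rep, next, true)} for a representative
 * edge {@code rep}, so that successful combinations are recorded in its edge
 * combos and can later be replayed for same-category edges via
 * {@code createAltEdges}, without re-invoking the combinatory rules.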
*/ public List createNewEdges(Edge edge, Edge next, boolean collectCombos) { // check for sem overlap if (edge.intersects(next)) return Collections.emptyList(); // check LF chunk constraints if (useChunks) { if (!edge.meetsLfChunkConstraints(next) || !next.meetsLfChunkConstraints(edge)) return Collections.emptyList(); } // make new edges ... List newEdges = null; // when using indexing: if (useIndexing) { // check for intersecting indices if (edge.indicesIntersect(next)) { newEdges = createNewEdges(edge, next, collectCombos, true); } // check for PairedWith relation else if (anyPairedNominals && pairedWith(edge, next)) { newEdges = createNewEdges(edge, next, collectCombos, false); } else if (anyPairedNominals && pairedWith(next, edge)) { newEdges = createNewEdges(next, edge, collectCombos, false); } // check for a missing index nominal on the target cat, // which can indicate a type-raised category that needs to combine // before its indices become adjacent else if (allowMissingIndexCombos && (edge.getIndexNominal() == null || next.getIndexNominal() == null)) { newEdges = createNewEdges(edge, next, collectCombos, true); } else { return Collections.emptyList(); } } // otherwise try everything else { newEdges = createNewEdges(edge, next, collectCombos, true); } // make alt edges for rest of edge's alts, with collectCombos option if (collectCombos && edge.altEdges.size() > 0) { int numNewEdges = newEdges.size(); // get num before adding any more for (int i = 0; i < numNewEdges; i++) { Edge resultEdge = newEdges.get(i); Sign resultSign = resultEdge.sign; Category resultCat = resultSign.getCategory(); Rule rule = resultSign.getDerivationHistory().getRule(); Sign[] resultInputs = resultSign.getDerivationHistory().getInputs(); boolean rightward = (resultInputs[0] == next.sign); boolean lefthead = (resultSign.getLexHead() == resultInputs[0].getLexHead()); for (int j = 0; j < edge.altEdges.size(); j++) { Edge furtherEdge = edge.altEdges.get(j); if (furtherEdge == edge) continue; Sign[] signs = (rightward) ? new Sign[] { next.sign, furtherEdge.sign } : new Sign[] { furtherEdge.sign, next.sign }; Sign lexHead = (rightward == lefthead) ? 
next.sign.getLexHead() : furtherEdge.sign.getLexHead(); Sign altSign = Sign.createDerivedSignWithNewLF(resultCat, signs, rule, lexHead); newEdges.add(makeAltEdge(altSign, resultEdge)); } } } // check instantiation of outermost cats checkInstantiation(newEdges); // done return newEdges; } // creates edges, combining in one or both directions per flag private List createNewEdges(Edge edgeA, Edge edgeB, boolean collectCombos, boolean bothDirections) { // get combined alts, checking compatibility List> combinedLfAlts = getCombinedLfAlts(edgeA.activeLfAlts, edgeB.activeLfAlts); if (combinedLfAlts == null) return Collections.emptyList(); // check whether a chunk is completed when gluing fragments boolean fragCompletion = false; if (gluingFragments) fragCompletion = completesChunk(edgeA, edgeB); // A B combos List results; if (gluingFragments) results = generalRules.applyGlueRule(edgeA.sign, edgeB.sign); else results = generalRules.applyBinaryRules(edgeA.sign, edgeB.sign); binaryRuleApps++; int numResults = results.size(); // B A combos List reversedResults = Collections.emptyList(); if (bothDirections) { if (gluingFragments) reversedResults = generalRules.applyGlueRule(edgeB.sign, edgeA.sign); else reversedResults = generalRules.applyBinaryRules(edgeB.sign, edgeA.sign); binaryRuleApps++; } int numReversedResults = reversedResults.size(); // make edges to return, updating edge combos (if apropos) List retval = Collections.emptyList(); if (numResults + numReversedResults > 0) { retval = new ArrayList(numResults + numReversedResults); BitSet union = (BitSet) edgeA.bitset.clone(); union.or(edgeB.bitset); int cardBefore = union.cardinality(); List> activeLfAlts = getActiveLfAlts(combinedLfAlts, union); // check for alt completion when gluing fragments if (gluingFragments && union.cardinality() > cardBefore) fragCompletion = true; for (int i = 0; i < numResults; i++) { Sign sign = results.get(i); if (fragCompletion) { ((AtomCat)sign.getCategory()).fragCompletion = true; } Edge resultEdge = makeEdge(sign, union, activeLfAlts); retval.add(resultEdge); if (collectCombos) { edgeA.edgeCombos.addRightwardCombo(edgeB, resultEdge); edgeB.edgeCombos.addLeftwardCombo(edgeA, resultEdge); } } for (int i = 0; i < numReversedResults; i++) { Sign sign = reversedResults.get(i); if (fragCompletion) { ((AtomCat)sign.getCategory()).fragCompletion = true; } Edge resultEdge = makeEdge(sign, union, activeLfAlts); retval.add(resultEdge); if (collectCombos) { edgeB.edgeCombos.addRightwardCombo(edgeA, resultEdge); edgeA.edgeCombos.addLeftwardCombo(edgeB, resultEdge); } } } // done return retval; } /** * Returns all edges that can be created by applying a unary rule * to the given edge or by combining it with a purely syntactic edge, * without collecting combos. */ public List createNewEdges(Edge edge) { return createNewEdges(edge, false); } /** * Returns all edges that can be created by applying a unary rule * to the given edge, or by combining it with a purely syntactic edge, * or by completing a realization/chunk/alt with an optional part, * while updating the given edge with collected combos, * if the collectCombos flag is true. * When gluing fragments, only the opt completion step is done. 
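 * For instance (the EP numbers are hypothetical): with three EPs in total and
 * a single optional part {2}, an edge covering {0,1} yields an opt-completed
 * edge covering {0,1,2} with the same sign, since the only missing EP is
 * optional.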
*/ public List createNewEdges(Edge edge, boolean collectCombos) { List retval = null; // instantiate on demand if (!gluingFragments) { List genResults = generalRules.applyUnaryRules(edge.sign); unaryRuleApps++; // make edges for results, updating edge combos if (genResults.size() > 0) { if (retval == null) retval = new ArrayList(genResults.size()); for (int i = 0; i < genResults.size(); i++) { Sign sign = genResults.get(i); // check for unary rule cycle; skip result if found if (sign.getDerivationHistory().containsCycle()) continue; Edge resultEdge = makeEdge(sign, edge.bitset, edge.activeLfAlts); retval.add(resultEdge); if (collectCombos) edge.edgeCombos.unaryResults.add(resultEdge); } } // do rule instances Sign[] signs = { edge.sign }; for (int i = 0; i < ruleInstances.size(); i++) { RuleInstance ruleInst = ruleInstances.get(i); // check sem overlap if (edge.intersects(ruleInst)) continue; // check for indices in common if (useIndexing && !edge.indicesIntersect(ruleInst)) continue; // check LF chunk constraints if (useChunks && !edge.meetsLfChunkConstraints(ruleInst)) continue; // get combined alts, checking compatibility List> combinedLfAlts = getCombinedLfAlts(edge.activeLfAlts, ruleInst.activeLfAlts); if (combinedLfAlts == null) continue; // apply rule List instResults = new ArrayList(1); ruleInst.rule.applyRule(signs, instResults); unaryRuleInstApps++; if (instResults.size() > 0) { if (retval == null) retval = new ArrayList(instResults.size()); BitSet union = (BitSet) edge.bitset.clone(); union.or(ruleInst.bitset); List> activeLfAlts = getActiveLfAlts(combinedLfAlts, union); for (int j = 0; j < instResults.size(); j++) { Sign sign = instResults.get(j); // check for unary rule cycle; skip result if found if (sign.getDerivationHistory().containsCycle()) continue; Edge resultEdge = makeEdge(sign, union, activeLfAlts); retval.add(resultEdge); if (collectCombos) edge.edgeCombos.unaryResults.add(resultEdge); } } } } // do opt completed edges if (!lfOpts.isEmpty() && !edge.complete()) { // get completed bitsets for each completed active alt or chunk, and for whole thing List optCompleted = new ArrayList(2); addOptCompletedBitSet(edge, allPreds, optCompleted); for (List altSet : edge.activeLfAlts) { for (Alt alt : altSet) { addOptCompletedBitSet(edge, alt.bitset, optCompleted); } } for (BitSet chunk : lfChunks) { addOptCompletedBitSet(edge, chunk, optCompleted); } // for each completed bitset, make complete edge with same sign for (BitSet completed : optCompleted) { List> activeLfAlts = getActiveLfAlts(edge.activeLfAlts, completed); // set frag completion if apropos if (gluingFragments && edge.sign.getCategory() instanceof AtomCat) { AtomCat ac = (AtomCat) edge.sign.getCategory(); if (ac.isFragment()) ac.fragCompletion = true; } Edge resultEdge = makeEdge(edge.sign, completed, activeLfAlts); resultEdge.optCompletes = edge; if (retval == null) retval = new ArrayList(1); retval.add(resultEdge); if (collectCombos) edge.edgeCombos.optionalResults.add(resultEdge); } } // ensure retval instantiated if (retval == null) retval = Collections.emptyList(); // check instantiation of outermost cats if (!gluingFragments) checkInstantiation(retval); // done return retval; } // bitset for checking completeness private BitSet tmpBitSetCompleteness = new BitSet(); // bitset for making retval private BitSet tmpBitSetRetval = new BitSet(); // adds a bitset with optional parts completed within the given bitset scope // to the given list, if the optional parts complete the given edge's bitset private void 
addOptCompletedBitSet(Edge edge, BitSet bitset, List optCompleted) { // check whether already complete tmpBitSetRetval.clear(); tmpBitSetRetval.or(edge.bitset); tmpBitSetRetval.and(bitset); if (tmpBitSetRetval.cardinality() == bitset.cardinality()) return; tmpBitSetRetval.or(edge.bitset); // or retval with opts when apropos for (BitSet opt : lfOpts) { if (subset(opt, bitset)) { if (edge.bitset.intersects(opt)) continue; // skip if opt not entirely missing tmpBitSetRetval.or(opt); } } // check completeness, add retval if complete (and distinct) tmpBitSetCompleteness.clear(); tmpBitSetCompleteness.or(bitset); tmpBitSetCompleteness.and(tmpBitSetRetval); if (tmpBitSetCompleteness.cardinality() == bitset.cardinality()) { if (!optCompleted.contains(tmpBitSetRetval)) optCompleted.add((BitSet)tmpBitSetRetval.clone()); } } /** Returns the edges that can be made by constructing alternative edges from the given edge and the collected combos in its representative edge. */ public List createAltEdges(Edge edge, Edge repEdge) { // instantiate return list with right capacity EdgeCombos edgeCombos = repEdge.edgeCombos; int numResults = numResultsFromCombos(edgeCombos.rightwardCombos); numResults += numResultsFromCombos(edgeCombos.leftwardCombos); numResults += edgeCombos.unaryResults.size(); numResults += edgeCombos.optionalResults.size(); List retval = new ArrayList(numResults); // make alt edges addAltsFromCombos(edge, edgeCombos.rightwardCombos, true, retval); addAltsFromCombos(edge, edgeCombos.leftwardCombos, false, retval); addAltsFromUnaryResults(edge, edgeCombos.unaryResults, retval); addAltsFromOptionalResults(edge, edgeCombos.optionalResults, retval); // done return retval; } // returns the number of results from the given combos private int numResultsFromCombos(List combos) { int retval = 0; for (int i = 0; i < combos.size(); i++) { EdgeCombos.CatCombo combo = combos.get(i); retval += combo.inputEdge.altEdges.size(); } return retval; } // adds alt edges for the given edge, combos, and direction to results private void addAltsFromCombos(Edge edge, List combos, boolean rightward, List results) { for (EdgeCombos.CatCombo combo : combos) { Edge resultEdge = combo.resultEdge; Sign resultSign = resultEdge.sign; Category resultCat = resultSign.getCategory(); Rule rule = resultSign.getDerivationHistory().getRule(); Sign[] resultInputs = resultSign.getDerivationHistory().getInputs(); boolean lefthead = (resultSign.getLexHead() == resultInputs[0].getLexHead()); List comboEdges = combo.inputEdge.altEdges; for (Edge comboEdge : comboEdges) { Sign[] signs = (rightward) ? new Sign[] { edge.sign, comboEdge.sign } : new Sign[] { comboEdge.sign, edge.sign }; Sign lexHead = (rightward == lefthead) ? 
edge.sign.getLexHead() : comboEdge.sign.getLexHead(); Sign altSign = Sign.createDerivedSignWithNewLF(resultCat, signs, rule, lexHead); results.add(makeAltEdge(altSign, resultEdge)); } } } // adds alt edges for the given edge and unary results to results private void addAltsFromUnaryResults(Edge edge, List unaryResults, List results) { for (Edge resultEdge : unaryResults) { Sign resultSign = resultEdge.sign; Category resultCat = resultSign.getCategory(); Rule rule = resultSign.getDerivationHistory().getRule(); Sign[] signs = { edge.sign }; Sign lexHead = edge.sign.getLexHead(); Sign altSign = Sign.createDerivedSignWithNewLF(resultCat, signs, rule, lexHead); results.add(makeAltEdge(altSign, resultEdge)); } } // adds alt edges for the given edge and optional results to results private void addAltsFromOptionalResults(Edge edge, List optionalResults, List results) { for (Edge resultEdge : optionalResults) { results.add(makeAltEdge(edge.sign, resultEdge)); } } /** Returns the number of rule applications executed. */ public int ruleApps() { return unaryRuleApps * generalRules.getUnaryRules().size() + unaryRuleInstApps + binaryRuleApps * generalRules.getBinaryRules().size(); } //----------------------------------------------------------------- // initGeneralRules // // separates out general rules with no semantics // nb: could consider adding feature licensing for type changing rules with no semantics private void initGeneralRules() { // add all binary rules to general rules for (Rule r : grammar.rules.getBinaryRules()) { generalRules.addRule(r); } // add type raising rules, and type changing ones with no semantics too for (Rule r : grammar.rules.getUnaryRules()) { // skip type changing rules with semantics if (r instanceof TypeChangingRule) { TypeChangingRule rule = (TypeChangingRule) r; if (rule.getResult().getLF() != null) { continue; } } // otherwise add it generalRules.addRule(r); } } //----------------------------------------------------------------- // initNoSemEdges // // creates edges for signs flagged as having no semantics, // and with appropriate licensing values in the initial edges private void initNoSemEdges() { // lookup signs by special index rel constant NO_SEM_FLAG lexicon.setSupertagger(null); // turn off hypertagger first Collection noSemSigns = lexicon.getSignsFromRel(Lexicon.NO_SEM_FLAG); lexicon.setSupertagger(hypertagger); // reset hypertagger if (noSemSigns == null) return; // sets for accumulating no sem edges Set instEdges = new HashSet(); Set uninstEdges = new HashSet(); // add signs with no LF and with matching licensing values Set instantiatedCats = new HashSet(); Set uninstantiatedCats = new HashSet(); List> emptyLfAlts = Collections.emptyList(); // loop until no more no sem edges int numInstEdges, numUninstEdges; do { numInstEdges = instEdges.size(); numUninstEdges = uninstEdges.size(); for (Sign sign : noSemSigns) { Category cat = sign.getCategory(); // get licensed, potentially instantiated cats instantiatedCats.clear(); uninstantiatedCats.clear(); featureLicenser.licenseEmptyCat(cat, instantiatedCats, uninstantiatedCats); // add edges for instantiated cats to initial edges, updating // feature map for (Category instCat : instantiatedCats) { featureLicenser.updateFeatureMap(instCat); featureLicenser.indexSemanticallyNullWords(instCat); Sign instSign = new Sign(sign.getWords(), instCat); instEdges.add(makeEdge(instSign, new BitSet(preds.size()), emptyLfAlts)); } // add edges for uninstantiated cats to no-sem edges, updating // feature map for (Category uninstCat : 
uninstantiatedCats) { featureLicenser.updateFeatureMap(uninstCat); featureLicenser.indexSemanticallyNullWords(uninstCat); Sign uninstSign = new Sign(sign.getWords(), uninstCat); Edge noSemEdge = makeEdge(uninstSign, new BitSet(preds.size()), emptyLfAlts); uninstEdges.add(noSemEdge); } } } while (numInstEdges != instEdges.size() || numUninstEdges != uninstEdges.size()); // update no sem edge lists instantiatedNoSemEdges.addAll(instEdges); noSemEdges.addAll(uninstEdges); } } ================================================ FILE: src/opennlp/ccg/realize/EdgeHash.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.realize; import gnu.trove.*; import java.util.*; /** * A set of edges, unique up to surface words. * Edges with higher scores or whose signs have lower derivational complexity are kept during insertion. * * @author Michael White * @version $Revision: 1.2 $, $Date: 2010/01/14 22:52:01 $ */ public class EdgeHash extends THashSet { private static final long serialVersionUID = 1L; /** Hashing strategy that uses Edge's surfaceWordHashCode and surfaceWordEquals methods. */ protected static TObjectHashingStrategy surfaceWordHashingStrategy = new TObjectHashingStrategy() { private static final long serialVersionUID = 1L; public int computeHashCode(java.lang.Object o) { return ((Edge)o).surfaceWordHashCode(); } public boolean equals(java.lang.Object o1, java.lang.Object o2) { return ((Edge)o1).surfaceWordEquals((Edge)o2); } }; /** Default constructor. */ public EdgeHash() { super(surfaceWordHashingStrategy); } /** * Returns this as a set of edges. */ @SuppressWarnings("unchecked") public Set asEdgeSet() { return (Set) this; } /** * Adds an edge, keeping the one with a higher score or whose sign has lower derivational complexity * if there is an equivalent one there already; returns the old * edge if it was displaced, the new edge if there was no equivalent * old edge, or null if the edge was not actually added. */ public Edge insert(Edge edge) { int pos = index(edge); // equiv edge if (pos >= 0) { Edge oldEdge = (Edge) _set[pos]; // already there? 
if (oldEdge == edge) return null; // check score if (edge.score > oldEdge.score) { _set[pos] = edge; return oldEdge; } // check complexity int complexity = edge.sign.getDerivationHistory().complexity(); int oldComplexity = oldEdge.sign.getDerivationHistory().complexity(); if (complexity < oldComplexity) { _set[pos] = edge; return oldEdge; } // otherwise toss else return null; } // add new else { add(edge); return edge; } } } ================================================ FILE: src/opennlp/ccg/realize/FeatureLicenser.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-4 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.realize; import opennlp.ccg.lexicon.*; import opennlp.ccg.unify.*; import opennlp.ccg.synsem.*; import opennlp.ccg.hylo.*; import java.util.*; /** * The feature licenser is a helper class for the edge factory, * responsible for managing features which license the use and * instantiation of semantically null or marked categories. * * @author Michael White * @version $Revision: 1.13 $, $Date: 2009/12/21 03:27:18 $ */ public class FeatureLicenser { // the edge factory for which this feature licenser is a helper private final EdgeFactory edgeFactory; // the licensing features private final LicensingFeature[] licensingFeatures; /** Constructor. */ public FeatureLicenser(EdgeFactory edgeFactory) { this.edgeFactory = edgeFactory; this.licensingFeatures = edgeFactory.grammar.lexicon.getLicensingFeatures(); } /** Constructor with licensing features. */ public FeatureLicenser(EdgeFactory edgeFactory, LicensingFeature[] licensingFeatures) { this.edgeFactory = edgeFactory; this.licensingFeatures = licensingFeatures; } //----------------------------------------------------------------- // semantically null word indexing /** * Adds new nominal atoms for subcategorized semantically null words. * A check is made for atomic categories with a value for the 'lex' * feature but with a null or uninstantiated index feature. If found, a new nominal atom is * created as the value of the index feature, and the nominal is * added to the edge factory's nominals map, for indexing purposes. * The same nominal is reused for repeated occurrences of a 'lex' value. 
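* For instance, an atomic category bearing a 'lex' value (say, a particle like "up") but no instantiated index would be assigned a fresh nominal such as w1 as its index value, and any later category with the same 'lex' value would be assigned that same nominal rather than a new one.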
*/ public void indexSemanticallyNullWords(Category cat) { cat.forall(semanticallyNullWordIndexer); } // counter private int wordCounter = 0; // 'lex' value to index map private Map wordIndexMap = new HashMap(); // cat function private CategoryFcn semanticallyNullWordIndexer = new CategoryFcnAdapter() { public void forall(Category c) { if (!(c instanceof AtomCat)) return; FeatureStructure fs = c.getFeatureStructure(); if (fs == null) return; if (!fs.hasAttribute("lex")) return; Object indexVal = fs.getValue("index"); if (indexVal == null || (indexVal instanceof NominalVar)) { String lexVal = fs.getValue("lex").toString(); String index = wordIndexMap.get(lexVal); NominalAtom nom; if (index == null) { do { index = "w" + ++wordCounter; nom = new NominalAtom(index); } while (edgeFactory.nominals.containsKey(nom)); wordIndexMap.put(lexVal, index); edgeFactory.nominals.put(nom, edgeFactory.nominals.size()); } else nom = new NominalAtom(index); fs.setFeature("index", nom); } } }; //----------------------------------------------------------------- // feature map // /** * Updates the licensed feature map with the info from the given initial category. */ public void updateFeatureMap(Category cat) { currentFeatureMap = featureMap; cat.forall(featureMapUpdater); currentFeatureMap = null; } // updates the category-specific licensed feature map private void updateCatFeatureMap(Category cat) { catFeatureMap.clear(); currentFeatureMap = catFeatureMap; cat.forall(featureMapUpdater); currentFeatureMap = null; } // a map from an attr name to a map from vals to sets of atomic categories // containing those attr-val pairs private Map>> featureMap = new HashMap>>(); // a feature map for a specific category to be checked private Map>> catFeatureMap = new HashMap>>(); // working feature map private Map>> currentFeatureMap = null; // list of all initial atom cats checked for main feature map private List allInitialAtomCats = new ArrayList(); // feature map updater private CategoryFcn featureMapUpdater = new CategoryFcnAdapter() { public void forall(Category c) { if (!(c instanceof AtomCat)) return; if (currentFeatureMap == featureMap) allInitialAtomCats.add(c); FeatureStructure fs = c.getFeatureStructure(); if (fs == null) return; // for each feature for (int i = 0; i < licensingFeatures.length; i++) { String attr = licensingFeatures[i].attr; Object val = fs.getValue(attr); if (val != null && !(val instanceof Variable)) { // check for relevant value String valStr = val.toString(); String fVal = licensingFeatures[i].val; List alsoList = licensingFeatures[i].alsoLicensedBy; if (fVal != null && !fVal.equals(valStr) && !alsoList.contains(valStr)) continue; // add to feature map Map> valMap = currentFeatureMap.get(attr); if (valMap == null) { valMap = new HashMap>(); currentFeatureMap.put(attr, valMap); } Set acSet = valMap.get(valStr); if (acSet == null) { acSet = new HashSet(); valMap.put(valStr, acSet); } acSet.add(c); } } } }; //----------------------------------------------------------------- // category licensing // /** * Returns whether the given category contains a feature indicating that * it needs to be licensed. */ public boolean needsLicensing(Category cat) { return checkLicensing(cat, true); } /** * Returns whether the given category is licensed according to * the current feature map. 
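* A category counts as licensed when a relevant licensing attribute-value pair it bears (or one of its alsoLicensedBy alternates) also occurs on some initial category recorded in the feature map, subject to the feature's target/args location constraint.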
*/ public boolean isLicensed(Category cat) { return checkLicensing(cat, false); } // records the licensing feature which succeeded in licensing the last cat (or null if none) private LicensingFeature currentLicensingFeature = null; // checks the given category according to the given flag, // updating currentLicensingFeature private boolean checkLicensing(Category cat, boolean needsLicensing) { currentLicensingFeature = null; boolean emptyCat = (cat.getLF() == null); // set up cat feature map updateCatFeatureMap(cat); Category target = getTarget(cat); // for each feature, look for appropriate attr-val pairs for (int i = 0; i < licensingFeatures.length; i++) { // skip when appropriate license flag not set if (emptyCat && !licensingFeatures[i].licenseEmptyCats) continue; if (!emptyCat && !licensingFeatures[i].licenseMarkedCats) continue; String attr = licensingFeatures[i].attr; Map> valMap = catFeatureMap.get(attr); if (valMap == null) continue; String fVal = licensingFeatures[i].val; Collection vals; if (fVal != null) { if (!valMap.containsKey(fVal)) continue; vals = new ArrayList(1); vals.add(fVal); } else { vals = valMap.keySet(); } byte loc = licensingFeatures[i].loc; // for each attr-val pair for (Iterator it = vals.iterator(); it.hasNext(); ) { String val = it.next(); Set atomCats = valMap.get(val); // check loc if (loc == LicensingFeature.TARGET_ONLY) { if (atomCats.size() != 1) continue; if (!atomCats.contains(target)) continue; } else if (loc == LicensingFeature.ARGS_ONLY) { if (atomCats.contains(target)) continue; } // branch on needs-licensing flag if (needsLicensing) { // found a feature needing to be licensed return true; } else { // check for licensing feature in feature map Map> fmValMap = featureMap.get(attr); // return false if not found if (fmValMap == null) return false; boolean foundLicensingVal = fmValMap.containsKey(val); if (!foundLicensingVal) { List alsoList = licensingFeatures[i].alsoLicensedBy; for (int j = 0; j < alsoList.size(); j++) { if (fmValMap.containsKey(alsoList.get(j))) { foundLicensingVal = true; break; } } } if (!foundLicensingVal) return false; // otherwise record licensing feature and return true currentLicensingFeature = licensingFeatures[i]; return true; } } } // otherwise false return false; } // returns the target cat, if complex, otherwise // just the cat itself private Category getTarget(Category cat) { Category target = cat; if (cat instanceof ComplexCat) { target = ((ComplexCat)cat).getTarget(); } return target; } //----------------------------------------------------------------- // empty (semantically null) category licensing and instantiation // // reusable simple substitution for instantiating vars on atom cats private SimpleSubstitution simpleSubst = new SimpleSubstitution(); /** * Determines whether the given semantically null category * is licensed according to the licensed feature map, and if so, returns * appropriately (un-)instantiated versions of the category. * The licensing features are checked in priority order. * NB: Instantiation is limited to the case where there is a single * value for the operative licensing feature. 
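* (Roughly, instantiation unifies the category's index variable with the index nominal of a matching initial category, so that the semantically null category ends up tied to a particular nominal in the input LF.)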
*/ public void licenseEmptyCat(Category cat, Set instantiatedCats, Set uninstantiatedCats) { // reindex UnifyControl.reindex(cat); // return cat uninstantiated if no licensing features found if (!needsLicensing(cat)) { uninstantiatedCats.add(cat); return; } // return nothing if not licensed if (!isLicensed(cat)) return; // find operative licensing feature, if necessary if (currentLicensingFeature == null) { for (int i = 0; i < licensingFeatures.length; i++) { if (!catFeatureMap.containsKey(licensingFeatures[i].attr)) continue; Map> valMap = catFeatureMap.get(licensingFeatures[i].attr); String fVal = licensingFeatures[i].val; if (fVal != null && !valMap.containsKey(fVal)) continue; currentLicensingFeature = licensingFeatures[i]; break; } // if still not found, return cat uninstantiated if (currentLicensingFeature == null) { uninstantiatedCats.add(cat); return; } } // return cat uninstantiated if licensing feature does not // have instantiation flag set if (!currentLicensingFeature.instantiate) { uninstantiatedCats.add(cat); return; } // return cat uninstantiated if licensing feature has more than one val String attr = currentLicensingFeature.attr; Map> valMap = catFeatureMap.get(attr); if (valMap.size() > 1) { uninstantiatedCats.add(cat); return; } String val = valMap.keySet().iterator().next(); Set atomCats = valMap.get(val); // for each atom cat, go ahead with instantiation ... for (Iterator acIt = atomCats.iterator(); acIt.hasNext(); ) { Category ac = acIt.next(); // ensure cats with lex feature have an index var FeatureStructure fs = ac.getFeatureStructure(); if (fs.hasAttribute("lex") && !fs.hasAttribute("index")) { fs.setFeature("index", new NominalVar("W")); UnifyControl.reindex(ac); } // unify with appropriate initial cats Collection initialCats = null; if (!currentLicensingFeature.licenseEmptyCats) initialCats = allInitialAtomCats; else { Map> fmValMap = featureMap.get(attr); initialCats = fmValMap.get(val); List alsoList = currentLicensingFeature.alsoLicensedBy; if (alsoList.size() > 0) { if (initialCats != null) initialCats = new HashSet(initialCats); else initialCats = new HashSet(); for (int i = 0; i < alsoList.size(); i++) { Set alsoSet = fmValMap.get(alsoList.get(i)); if (alsoSet != null) initialCats.addAll(alsoSet); } } } if (initialCats == null) { System.out.println("Warning, unable to find initial cats for feature " + attr + "=" + val); uninstantiatedCats.add(cat); return; } // for each initial cat for (Iterator it = initialCats.iterator(); it.hasNext(); ) { Category initialAC = it.next(); // ensure index instantiated FeatureStructure initialFS = initialAC.getFeatureStructure(); if (initialFS == null) continue; Object index = initialFS.getValue("index"); if (!(index instanceof NominalAtom)) continue; // block instantiation with bound vars if (edgeFactory.boundVarNominals.contains(index)) { instantiatedCats.clear(); uninstantiatedCats.add(cat); return; } // try unifying index ... 
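// nb: only the index binding from the unification below is kept; any other substitutions are discarded before filling in the category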
simpleSubst.clear(); try { Unifier.unify(ac.getFeatureStructure(), initialFS, simpleSubst); // ensure substitution contains index if (!simpleSubst.containsValue(index)) continue; // get rid of other substitutions for (Iterator it2 = simpleSubst.values().iterator(); it2.hasNext(); ) { if (!it2.next().equals(index)) it2.remove(); } // instantiate Category instCat = (Category) cat.fill(simpleSubst); // and add instantiated cats instantiatedCats.add(instCat); } catch (UnifyFailure uf) {} } } } } ================================================ FILE: src/opennlp/ccg/realize/Hypertagger.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2008-9 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.realize; import opennlp.ccg.lexicon.*; import opennlp.ccg.hylo.*; import java.util.*; /** * A hypertagger is a realization supertagger. It must extend the * SupertaggerAdapter interface for plugging a supertagger into the * lexicon. * * @author Michael White * @version $Revision: 1.5 $, $Date: 2009/08/24 01:56:14 $ */ public interface Hypertagger extends SupertaggerAdapter { /** * Maps the given elementary predications to their predicted categories, * so that the beta-best categories can be returned by calls to setPred * and getSupertags. */ public void mapPreds(List preds); /** * Sets the current elementary predication to the one with the given index, * so that the beta-best categories for it can be returned by a call to * getSupertags. */ public void setPred(int index); /** * Stores the gold standard pred info, for use in discriminative training. * The string consists of space delimited tokens, where each token * is a colon-separated list of fields, with the first field containing * the nominal id, and the second field the gold supertag. */ public void storeGoldStdPredInfo(String goldStdPredInfo); } ================================================ FILE: src/opennlp/ccg/realize/LexicalDiversityPruningStrategy.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2011 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. 
// // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.realize; import opennlp.ccg.lexicon.Word; import opennlp.ccg.synsem.Sign; import gnu.trove.THashSet; import gnu.trove.TObjectIdentityHashingStrategy; import java.util.*; /** * A diversity pruning strategy that defines signs to be * notCompellinglyDifferent if the set of open class stems * is the same. The POS classes of interest are set in the * constructor. * * @author Michael White * @version $Revision: 1.1 $, $Date: 2011/04/02 16:32:17 $ */ public class LexicalDiversityPruningStrategy extends DiversityPruningStrategy { /** The interned POS values to use for relevant open class stems. */ @SuppressWarnings("unchecked") protected Set posValsToUse = new THashSet(new TObjectIdentityHashingStrategy()); /** Reusable set of observed interned stems for comparison purposes. */ @SuppressWarnings("unchecked") protected Set stemsSeen = new THashSet(new TObjectIdentityHashingStrategy()); /** Constructor, which sets POS classes of interest. */ public LexicalDiversityPruningStrategy() { String[] poslist = { "JJ", "JJR", "JJS", "NN", "NNP", "NNS", "NNPS", "RB", "RBR", "RBS", "VB", "VBD", "VBG", "VBN", "VBP", "VBZ" }; for (String pos : poslist) posValsToUse.add(pos); } /** Returns true iff the given signs are not compellingly different. In particular, returns true iff the set of relevant open class stems are the same. */ public boolean notCompellinglyDifferent(Sign sign1, Sign sign2) { stemsSeen.clear(); for (Word w : sign1.getWords()) { if (posValsToUse.contains(w.getPOS())) stemsSeen.add(w.getStem()); } for (Word w : sign2.getWords()) { if (posValsToUse.contains(w.getPOS()) && !stemsSeen.contains(w.getStem())) return false; } return true; } } ================================================ FILE: src/opennlp/ccg/realize/NBestPruningStrategy.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.realize; import opennlp.ccg.TextCCG; import java.util.*; import java.util.prefs.*; /** * Default, n-best edge pruning strategy. * * @author Michael White * @version $Revision: 1.9 $, $Date: 2011/03/27 14:45:32 $ */ public class NBestPruningStrategy implements PruningStrategy { /** The current pruning val. */ protected int CAT_PRUNE_VAL; /** Reusable return list. */ protected List retval = new ArrayList(); /** Constructor with pruning val. 
*/ public NBestPruningStrategy(int pruningVal) { CAT_PRUNE_VAL = pruningVal; } /** Default constructor retrieves pruning val from preferences. */ public NBestPruningStrategy() { Preferences prefs = Preferences.userNodeForPackage(TextCCG.class); CAT_PRUNE_VAL = prefs.getInt(Chart.PRUNING_VALUE, Chart.NO_PRUNING); } /** * Returns a (possibly empty) list of edges pruned * from the given ones, which should be sorted by score, * from highest to lowest. * In particular, prunes and returns the edges that follow the N-best * ones in the given list. */ public List pruneEdges(List catEdges) { // clear reusable return list retval.clear(); // ensure pruning enabled if (CAT_PRUNE_VAL == Chart.NO_PRUNING) return retval; // nb: could add an option to prune all edges with zero score /* for (Iterator it = catEdges.iterator(); it.hasNext(); ) { Edge edge = it.next(); if (edge.score == 0) { retval.add(edge); it.remove(); } } */ // return edges at bottom of list, starting with CAT_PRUNE_VAL (if any) while (CAT_PRUNE_VAL < catEdges.size()) { retval.add(catEdges.remove(CAT_PRUNE_VAL)); } // done return retval; } } ================================================ FILE: src/opennlp/ccg/realize/PruningStrategy.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.realize; import java.util.*; /** * Interface for edge pruning strategies. * * @author Michael White * @version $Revision: 1.4 $, $Date: 2011/03/27 14:45:32 $ */ public interface PruningStrategy { /** * Prunes and returns a (possibly empty) list of edges * from the given ones, which should be sorted by score, * from highest to lowest. */ public List pruneEdges(List catEdges); } ================================================ FILE: src/opennlp/ccg/realize/Realizer.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-11 University of Edinburgh / Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details.
// // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.realize; import opennlp.ccg.grammar.*; import opennlp.ccg.synsem.*; import opennlp.ccg.hylo.*; import opennlp.ccg.*; import org.jdom.*; import java.util.*; import java.util.prefs.*; /** * The realizer manages the realization process. * Realization options may be set for use across calls * to the realizer. * * @author Michael White * @version $Revision: 1.31 $, $Date: 2011/07/19 03:40:46 $ */ public class Realizer { /** The grammar used for realization. */ public final Grammar grammar; /** Flag for whether to use depth-first search. Defaults to false. */ public boolean depthFirst = false; // the chart used to realize a request private Chart chart = null; /** Constructor. */ public Realizer(Grammar grammar) { this.grammar = grammar; } /** Returns the chart used in the latest request, or null if none. */ public Chart getChart() { return chart; } //----------------------------------------------------------------- // default options, for use when not given in realization request // nb: as the usual practice is to set these options once // for reuse across calls to the realizer, only a subset of // the options may be overridden in different calls to the // realize method /** Time limit in ms. (Default is -1, or none.) */ public int timeLimitMS = -1; /** Flag for whether to wait for a complete edge. (Default is false.) */ public boolean waitForCompleteEdge = false; /** Sign scorer to use. (Default is none.) */ public SignScorer signScorer = null; /** Pruning strategy to use. (Default is none.) */ public PruningStrategy pruningStrategy = null; /** Hypertagger to use. (Default is none.) */ public Hypertagger hypertagger = null; //----------------------------------------------------------------- // get LF from doc /** * Retrieves an input LF from the given XML doc, processing any * LF chunks along the way. */ public static LF getLfFromDoc(Document doc) { Element rootElt = doc.getRootElement(); Element lfElt = (rootElt.getName().equals("lf")) ? rootElt : rootElt.getChild("lf"); return getLfFromElt(lfElt); } /** * Retrieves an input LF from the given XML element, processing any * LF chunks along the way. */ public static LF getLfFromElt(Element lfElt) { HyloHelper.processChunks(lfElt); LF lf = HyloHelper.getLF(lfElt); return lf; } //----------------------------------------------------------------- // realization routines /** * Realizes the input LF, * returning the best edge found (or null if none). */ public Edge realize(LF lf) { return realize(lf, this.signScorer); } /** * Realizes the input LF relative to the given sign scorer, * returning the best edge found (or null if none). */ public Edge realize(LF lf, SignScorer signScorer) { Preferences prefs = Preferences.userNodeForPackage(TextCCG.class); int timeLimitToUse = (timeLimitMS != -1) ? timeLimitMS : prefs.getInt(Chart.TIME_LIMIT, Chart.NO_TIME_LIMIT); return realize(lf, signScorer, timeLimitToUse, waitForCompleteEdge); } /** * Realizes the input LF relative to given sign scorer, * returning the best edge found (or null if none) * in the given time limit (in ms), potentially waiting * longer for a complete edge according to the given flag. 
* If a hypertagger is employed, realization proceeds * iteratively through the available beta-best values * within the overall time or edge limit. */ public Edge realize(LF lf, SignScorer signScorer, int timeLimitMS, boolean waitForCompleteEdge) { List preds = HyloHelper.flatten(lf); SignScorer scorerToUse = (signScorer != null) ? signScorer : SignScorer.nullScorer; PruningStrategy strategyToUse = (pruningStrategy != null) ? pruningStrategy : new NBestPruningStrategy(); // realize iteratively with hypertagger, if present if (hypertagger != null) { return realizeWithHypertagger(preds, scorerToUse, strategyToUse, timeLimitMS); } // otherwise make chart, set start time long startTime = System.currentTimeMillis(); chart = new Chart(new EdgeFactory(grammar, preds, scorerToUse), strategyToUse); chart.startTime = startTime; chart.depthFirst = depthFirst; // run request chart.initialize(); chart.combine(timeLimitMS, waitForCompleteEdge); // XXX tmp // if no complete edge, try again gluing fragments // if (!chart.bestEdge.complete()) { // System.out.println("Trying to glue fragments ..."); // chart.reInitForGluing(); // chart.combine(timeLimitMS, waitForCompleteEdge); // } // return best edge return chart.bestEdge; } // XXX tmp switch for gluing private boolean useGluing = Boolean.getBoolean("useGluing"); // iterate through beta-best values until a complete realization is found; // otherwise return the best fragment using the glue rule, or if all else // fails (or not using gluing), greedy fragment joining private Edge realizeWithHypertagger(List preds, SignScorer signScorer, PruningStrategy pruningStrategy, int timeLimitMS) { // get start time long startTime = System.currentTimeMillis(); // get edge limit Preferences prefs = Preferences.userNodeForPackage(TextCCG.class); int edgeLimit = prefs.getInt(Chart.EDGE_LIMIT, Chart.NO_EDGE_LIMIT); // set supertagger in lexicon grammar.lexicon.setSupertagger(hypertagger); // reset beta hypertagger.resetBeta(); // loop until retval set or need to give up Edge retval = null; chart = null; boolean outOfBetas = false; boolean pastTimeLimit = false; boolean exceededEdgeLimit = false; long iterStartTime = 0, currentTime = 0; int iterTime = 0; while (retval == null && !outOfBetas && !pastTimeLimit && !exceededEdgeLimit) { // instantiate chart and set start time for this iteration chart = new Chart(new EdgeFactory(grammar, preds, signScorer, hypertagger), pruningStrategy); iterStartTime = System.currentTimeMillis(); // do realization in packing mode to see if a complete realization // can be found with this hypertagger setting chart.usePacking = true; chart.collectCombos = false; chart.doUnpacking = false; chart.joinFragments = false; // run request chart.initialize(); if (chart.noUncoveredPreds()) chart.combine(timeLimitMS, false); // check time limit currentTime = System.currentTimeMillis(); iterTime = (int) (currentTime - iterStartTime); if (timeLimitMS != Chart.NO_TIME_LIMIT && iterTime >= timeLimitMS) { pastTimeLimit = true; // System.out.println("Went past time limit with ht beta: " + hypertagger.getCurrentBetaValue()); } // check edge limit if (edgeLimit != Chart.NO_EDGE_LIMIT && chart.numEdges >= edgeLimit) { exceededEdgeLimit = true; // System.out.println("Exceeded edge limit with ht beta: " + hypertagger.getCurrentBetaValue()); } // if complete, unpack and return best edge if (chart.bestEdge.complete()) { chart.doUnpacking = true; chart.doUnpacking(); retval = chart.bestEdge; } // otherwise check beta level if still within limits else if (!pastTimeLimit 
&& !exceededEdgeLimit) { // progress to next beta setting, if any if (hypertagger.hasMoreBetas()) { hypertagger.nextBeta(); } else { // otherwise out of betas outOfBetas = true; // System.out.println("Ran out of betas with ht beta: " + hypertagger.getCurrentBetaValue()); } } } // if no result, take desperate measures with fragments if (retval == null) { // try realization with gluing if (useGluing) { // System.out.println("Num edges for final iteration: " + chart.numEdges); // System.out.println("Trying gluing option after iterTime: " + iterTime); chart.reInitForGluing(); // double time and space limits, to give gluing option some room chart.edgeLimit = edgeLimit * 2; chart.combine(timeLimitMS * 2, waitForCompleteEdge); // System.out.println("Num edges after gluing: " + chart.numEdges); currentTime = System.currentTimeMillis(); iterTime = (int) (currentTime - iterStartTime); // if complete, unpack and return best edge if (chart.bestEdge.complete()) { // System.out.println("Unpacking in final iteration after iterTime: " + iterTime); chart.doUnpacking = true; chart.doUnpacking(); retval = chart.bestEdge; } } // otherwise try a final iteration in anytime mode, possibly resorting to joining fragments if (retval == null) { // System.out.println("Trying a final iteration in anytime mode after iterTime: " + iterTime); // instantiate chart and set start time for this iteration chart = new Chart(new EdgeFactory(grammar, preds, signScorer, hypertagger), pruningStrategy); iterStartTime = System.currentTimeMillis(); // run request chart.usePacking = false; chart.joinFragments = true; chart.initialize(); chart.combine(timeLimitMS, waitForCompleteEdge); // System.out.println("Num edges after anytime iteration: " + chart.numEdges); currentTime = System.currentTimeMillis(); iterTime = (int) (currentTime - iterStartTime); // if (chart.bestEdge.complete()) // System.out.println("Found complete edge after iterTime: " + iterTime); // else // System.out.println("Resorting to joined fragments after iterTime: " + iterTime); // return best edge retval = chart.bestEdge; } } // update end time long endTime = System.currentTimeMillis(); chart.timeTilDone = (int) (endTime - startTime); // reset supertagger in lexicon grammar.lexicon.setSupertagger(null); // return return retval; } } ================================================ FILE: src/opennlp/ccg/realize/RuleInstance.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-5 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.realize; import opennlp.ccg.grammar.*; import opennlp.ccg.hylo.*; import java.util.*; //import java.util.prefs.*; //import java.text.*; /** * A rule instance is a tracker for an instantiated version of a type changing * rule, ie a type changing rule with its semantics instantiated together with * bitsets representing its coverage of the input predicates * and the indices in its arg category, along with lists of the active LF alts. * Such rule instances are created and managed by an EdgeFactory. * The design follows the Singleton pattern. * * @author Michael White * @version $Revision: 1.7 $, $Date: 2005/11/24 03:22:08 $ */ public class RuleInstance extends Tracker { /** The instantiated type changing rule. */ public final TypeChangingRule rule; /** Constructor. */ public RuleInstance(TypeChangingRule rule, BitSet bitset, BitSet indices, List> activeLfAlts) { super(bitset, indices, activeLfAlts); this.rule = rule; } /** Returns '{bitset} name: arg => result'. */ public String toString() { StringBuffer sb = new StringBuffer(); //sb.append(indices + " "); sb.append(bitset + " "); sb.append(rule); return sb.toString(); } } ================================================ FILE: src/opennlp/ccg/realize/StemPruningStrategy.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.realize; import opennlp.ccg.lexicon.Word; import opennlp.ccg.synsem.Sign; import java.util.*; /** * A diversity pruning strategy that defines signs to be * notCompellinglyDifferent if they have the same sequence of * stems. * The empty constructor defaults the singleBestPerGroup flag * to true. * * @author Michael White * @version $Revision: 1.1 $, $Date: 2011/04/02 16:32:17 $ */ public class StemPruningStrategy extends DiversityPruningStrategy { /** Constructor, defaults singleBestPerGroup to true. */ public StemPruningStrategy() { this(true); } /** Full constructor. */ public StemPruningStrategy(boolean singleBestPerGroup) { this.singleBestPerGroup = singleBestPerGroup; } /** Returns true iff the given signs are not compellingly different. In particular, returns true iff the signs have the same sequence of stems. 
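* (Stems are compared by identity below, which presumes that stem strings are interned, as Word attributes generally are in OpenCCG.)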
*/ public boolean notCompellinglyDifferent(Sign sign1, Sign sign2) { List words1 = sign1.getWords(); List words2 = sign2.getWords(); if (words1.size() != words2.size()) return false; for (int i=0; i < words1.size(); i++) { if (words1.get(i).getStem() != words2.get(i).getStem()) return false; } return true; } } ================================================ FILE: src/opennlp/ccg/realize/Tracker.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-5 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.realize; import opennlp.ccg.hylo.*; import java.util.*; /** * A tracker is a wrapper for either a sign (ie, an edge) or * a type changing rule (ie, a rule instance) which has bitsets for * representing the coverage of the input predicates and the semantic indices used. * It also has a list of active LF alts. * Trackers are created by an EdgeFactory. * The design follows the Singleton pattern. * * @author Michael White * @version $Revision: 1.9 $, $Date: 2005/11/24 03:15:26 $ */ public class Tracker { /** The coverage bitset. */ public final BitSet bitset; /** The indices bitset. */ public final BitSet indices; /** The active LF alts. */ public final List> activeLfAlts; /** Constructor. */ public Tracker(BitSet bitset, BitSet indices, List> activeLfAlts) { this.bitset = bitset; this.indices = indices; this.activeLfAlts = activeLfAlts; } /** * Returns whether the coverage bitset of this tracker intersects with the * coverage bitset of the given one. */ public boolean intersects(Tracker tracker) { return bitset.intersects(tracker.bitset); } /** * Returns whether the indices bitset of this tracker intersects with the * indices bitset of the given one, if both non-empty; otherwise, returns * true (if either this tracker or the given one has no indices). 
*/ public boolean indicesIntersect(Tracker tracker) { return indices.isEmpty() || tracker.indices.isEmpty() || indices.intersects(tracker.indices); } } ================================================ FILE: src/opennlp/ccg/realize/hypertagger/FeatureExtractionException.java ================================================ package opennlp.ccg.realize.hypertagger; public class FeatureExtractionException extends Exception { public FeatureExtractionException(String string) { super(string); } public FeatureExtractionException() { super(); } /** * */ private static final long serialVersionUID = 1L; } ================================================ FILE: src/opennlp/ccg/realize/hypertagger/LFInfo.java ================================================ package opennlp.ccg.realize.hypertagger; import opennlp.ccg.synsem.LF; /** * @author espinosa * This class encapsulates a LF and its corresponding gold standard predicate info, if available. */ public class LFInfo { LF lf; String fullWords; String lfNum; public LFInfo(LF lf, String fullWords, String lfNum) { this.lf = lf; this.fullWords = fullWords; this.lfNum = lfNum; } public LF getLF() { return this.lf; } public String getFullWords() { return this.fullWords; } public String getLFNum() { return this.lfNum; } } ================================================ FILE: src/opennlp/ccg/realize/hypertagger/LFLoader.java ================================================ package opennlp.ccg.realize.hypertagger; import java.io.File; import java.io.FileFilter; import java.io.IOException; import java.net.MalformedURLException; import java.net.URL; import java.util.ArrayList; import java.util.Arrays; import java.util.Iterator; import java.util.LinkedList; import java.util.List; import opennlp.ccg.grammar.Grammar; import opennlp.ccg.hylo.HyloHelper; import opennlp.ccg.realize.Realizer; import opennlp.ccg.synsem.LF; import org.jdom.Document; import org.jdom.Element; /** * @author espinosa * This class abstracts over a collection of LFs contained in a collection of files. */ public class LFLoader implements Iterator { static class XmlFilenameFilter implements FileFilter { public boolean accept(File f) { return f.getName().toLowerCase().endsWith(".xml"); } } Grammar grammar; ArrayList lfFiles; int filePos = 0; LinkedList lfs; int total = 0; int skipped = 0; /** * Constructs a new LFLoader which will load LFs from a collection of files or directories under a base directory. * @param grammarFile The grammar to use * @param baseDir The base directory. Paths will be interpreted relative to this directory. * @param paths The files to load the LFs from. Directories or files can be given. Directories are not searched recursively. Only files ending * in .xml will be loaded. 
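* Comma-separated path entries are split into individual paths, and surrounding whitespace is trimmed.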
*/ public LFLoader(File grammarFile, File baseDir, List paths) { lfs = new LinkedList(); URL grammarURL = null; try { grammarURL = grammarFile.toURI().toURL(); } catch (MalformedURLException e1) { e1.printStackTrace(); } try { grammar = new Grammar(grammarURL); } catch (Exception e) { e.printStackTrace(); } lfFiles = new ArrayList(); paths = normalize(paths); for (String lfFilename : paths) { // if this argument is a directory, load all XML files from it File f = new File(baseDir, lfFilename); if(f.isDirectory()) { lfFiles.addAll(Arrays.asList(f.listFiles(new XmlFilenameFilter()))); } else { lfFiles.add(f); } } } private List normalize(List paths) { ArrayList ret = new ArrayList(); for(String s: paths) { if(s.indexOf(',') < 0) { ret.add(s.trim()); } else { // explode comma-separated values into separate strings String[] fields = s.split(","); for(String f : fields) { ret.add(f.trim()); } } } return ret; } @SuppressWarnings("unchecked") private void loadFile(File lfFile) { Document doc = null; int n = 0; try { doc = grammar.loadFromXml(lfFile.getAbsolutePath()); } catch (IOException e) { // if there's a problem, just skip this file System.err.println("Couldn't open input file " + lfFile + ", skipping.\n"); return; } catch (Exception e) { e.printStackTrace(); return; } Element root = doc.getRootElement(); List testItems = root.getChildren(); // Iterate through test item LFS and print to file/stdio tags predicted // by the hypertagger for (Element item : testItems) { String lfNum = "unk"; lfNum = item.getAttributeValue("info"); Element itemLFElt = item.getChild("lf"); //Element itemFullWordsElt = item.getChild("full-words"); Element itemPredInfoElt = item.getChild("pred-info"); //String sentId = itemFullWordsElt.getAttributeValue("info"); //String fullWords = itemFullWordsElt.getTextNormalize(); // mww: extra null check String predInfo = null; if (itemPredInfoElt != null) predInfo = itemPredInfoElt.getAttributeValue("data"); //String predInfo = itemPredInfoElt.getAttributeValue("data"); if(predInfo == null || predInfo.equals("")) { /* because this class is used to load LFs for training purposes, we can't continue without the gold-std info */ // mww: added info: lfNum System.err.println("No pred-info found for lf #" + n + " (info: " + lfNum + ") in file " + lfFile + ", skipping."); skipped++; continue; } // mww: added try-catch block try { LF lf = Realizer.getLfFromElt(itemLFElt); LF flatLF = HyloHelper.flattenLF(lf); lfs.offer(new LFInfo(flatLF, predInfo, lfNum)); } catch (Exception exc) { System.err.println("Skipping lf #" + n + " (info: " + lfNum + ") in file " + lfFile + ", uncaught exception:"); System.err.println(exc.getMessage()); exc.printStackTrace(System.err); skipped++; continue; } n++; total++; } System.err.println("LFL: loaded " + n + " LFs from " + lfFile); } /* two cases: * - if there's an LF in the queue, return it * - if there isn't, load the next file -- BUT -- if the LF queue is still empty, load the next file, and so on */ public boolean hasNext() { if(!lfs.isEmpty()) { return true; } // queue is empty, load next file while(lfs.isEmpty()) { if(filePos == lfFiles.size()) { return false; // no more files } loadFile(lfFiles.get(filePos)); filePos++; } return true; } // this method returns null when no more LFs can be loaded public LFInfo next() { if(!lfs.isEmpty()) { return lfs.poll(); } while(lfs.isEmpty()) { if(filePos == lfFiles.size()) { return null; } loadFile(lfFiles.get(filePos)); } return lfs.poll(); } public void remove() { // NOT IMPLEMENTED throw new 
RuntimeException("Method not implemented"); } public int getTotal() { return this.total; } public int getSkipped() { return this.skipped; } } ================================================ FILE: src/opennlp/ccg/realize/hypertagger/LMFactorExtractor.java ================================================ package opennlp.ccg.realize.hypertagger; import java.io.BufferedReader; import java.io.File; import java.io.FileReader; import java.io.IOException; /* this is a copy of TagExtract, modified to extract SRILM-format data using the full-words * element from XML-format LFs. * The input is a file in which each line is a "pred-info"-style line, one per LF. * The input file is given as the sole commandline argument. * The factors are written to stdout. */ public class LMFactorExtractor { public static void main(String args[]) { BufferedReader rd = null; int lineNum = 0; int bNum = 0; try { rd = new BufferedReader(new FileReader(new File(args[0]))); } catch (Exception e) { e.printStackTrace(); System.exit(1); } String line = null; StringBuilder out; while(true) { try { line = rd.readLine(); } catch(IOException e) { e.printStackTrace(); System.exit(1); } lineNum++; if(line == null) { break; } if(line.matches("^\\s*$")) { continue; } out = new StringBuilder(); out.append(" "); String[] fields = line.split("\\s+"); bNum = 0; for(String f : fields) { bNum++; String[] info = f.split(":"); if(info.length != 4) { System.err.println("Wrong number of fields encountered in input line " + lineNum + ", bundle " + bNum); System.exit(1); } out.append(info[3]); out.append(":S-"); out.append(info[3]); out.append(":P-"); out.append(info[2]); out.append(":T-"); out.append(info[1]); out.append(" "); } out.append(""); System.out.println(out.toString()); } } } ================================================ FILE: src/opennlp/ccg/realize/hypertagger/TagExtract.java ================================================ package opennlp.ccg.realize.hypertagger; import java.io.BufferedWriter; import java.io.File; import java.io.FileFilter; import java.io.FileWriter; import java.io.IOException; import java.util.Comparator; import static java.util.Arrays.*; import joptsimple.*; import opennlp.ccg.realize.hypertagger.TagExtractor; import opennlp.ccg.synsem.LF; import opennlp.ccg.util.Pair; public class TagExtract { private static boolean quiet = false; // when true, suppress stderr messages @SuppressWarnings("unused") private static File posModelFile; private static File hyperModelFile; private static File posPriorModelFile; private static File htPriorModelFile; private static File posVocabFile; private static File htVocabFile; private static String argnames; private TagExtractor tex; private BufferedWriter output; @SuppressWarnings({ "unchecked", "rawtypes" }) static class PairComparator implements Comparator { @SuppressWarnings("boxing") public int compare(Pair p, Pair q) { if(p.a > q.a) { return 1; } if(p.a == q.a) { return 0; } return -1; } public int compare(Object p, Object q) { return this.compare((Pair) p, (Pair)q ); } } static class XmlFilenameFilter implements FileFilter { public boolean accept(File f) { return f.getName().toLowerCase().endsWith(".xml"); } } public TagExtract(TagExtractor t) { this.tex = t; } /* TODO: this method should probably be rewritten to use LFLoader and a config file */ public static void main(String[] args) throws IOException { TagExtract t = null; //PrintStream output = System.out; BufferedWriter output; //int lfcount = 0; //int lfNum = 0; // option processing OptionParser o = new 
OptionParser(); o.acceptsAll(asList("help", "h"), "this message"); o.acceptsAll(asList("quiet", "q"), "print no messages"); o.acceptsAll(asList("pos", "pos"), "extract POS features"); OptionSpec pos_s = o.acceptsAll(asList("p", "pos-model")).withRequiredArg().ofType(File.class).describedAs("POS model to use"); OptionSpec outf = o.acceptsAll(asList("o", "output")).withRequiredArg().ofType(File.class).describedAs("output file"); OptionSpec posPrior_s = o.acceptsAll(asList("P", "pos-prior")).withRequiredArg().ofType(File.class).describedAs("POS prior model to use"); OptionSpec ht_s = o.acceptsAll(asList("y", "hyper-model")).withRequiredArg().ofType(File.class).describedAs("HT model to use as input to 2-pass model (see README)"); OptionSpec htPrior_s = o.acceptsAll(asList("H", "ht-prior")).withRequiredArg().ofType(File.class).describedAs("HT prior model to use"); OptionSpec gr_s = o.acceptsAll(asList("g", "grammar")).withRequiredArg().ofType(File.class).describedAs("grammar filename"); OptionSpec ht_vocab_s = o.acceptsAll(asList("V", "ht-prior-vocab")).withRequiredArg().ofType(File.class).describedAs("HT prior vocab filename"); OptionSpec pos_vocab_s = o.acceptsAll(asList("v", "pos-prior-vocab")).withRequiredArg().ofType(File.class).describedAs("POS prior vocab filename"); OptionSpec corpusDir_s = o.acceptsAll(asList("d", "lf-dir")).withRequiredArg().ofType(File.class).describedAs("Directory to change to before searching for XML files"); OptionSpec argnames_s = o.acceptsAll(asList("an", "argnames")).withRequiredArg().describedAs("Names of argument roles in format name(:shortname)?"); OptionSet options = o.parse(args); /* if -h (help) is given, print message and exit */ if (options.has("h") || args.length == 0) { o.printHelpOn(System.out); System.out.println("See the README for additional information."); System.exit(0); } output = new BufferedWriter(new FileWriter(options.valueOf(outf))); // some of these will be nulls, depending on what the user is trying to do hyperModelFile = options.valueOf(ht_s); posModelFile = options.valueOf(pos_s); posPriorModelFile = options.valueOf(posPrior_s); posVocabFile = options.valueOf(pos_vocab_s); htPriorModelFile = options.valueOf(htPrior_s); htVocabFile = options.valueOf(ht_vocab_s); argnames = options.valueOf(argnames_s); if(options.has("q")) quiet = true; LFLoader lfs = new LFLoader(options.valueOf(gr_s), options.valueOf(corpusDir_s), options.nonOptionArguments()); if(options.has("pos")) { TagExtractor tex = new ZLPOSTagger(); // mww: set arg names if (argnames != null) debug("Setting arg names to " + argnames + "\n"); tex.setArgNames(argnames); // uses default names if null if(posPriorModelFile != null && posVocabFile != null) { debug("Loading POS model priors from " + posPriorModelFile + "\n"); debug("Loading POS model vocab from " + posVocabFile + "\n"); tex.loadPriorModel(posPriorModelFile, posVocabFile); } debug("Extracting POS features..." 
+ "\n"); t = new TagExtract(tex); } else { // extracting hypertags // using GS pos tags TagExtractor tex = new ZLMaxentHypertagger(); // mww: set arg names if (argnames != null) debug("Setting arg names to " + argnames + "\n"); tex.setArgNames(argnames); // uses default names if null if(htPriorModelFile != null && htVocabFile != null) { debug("Loading HT model priors from " + htPriorModelFile + "\n"); debug("Loading HT model vocab from " + htVocabFile + "\n"); tex.loadPriorModel(htPriorModelFile,htVocabFile); } if(hyperModelFile != null) { debug("Loading proto-HT model from " + hyperModelFile + "\n"); tex.loadProtoModel(hyperModelFile); } debug("Extracting hypertagger features..." + "\n"); t = new TagExtract(tex); } t.setOutput(output); while(lfs.hasNext()) { LFInfo lfi = lfs.next(); LF lf = lfi.getLF(); try { //lfNum++; t.extract(lf, lfi.getFullWords()); //lfcount++; //debug("LFs extracted: " + lfcount + "\r"); } catch (FeatureExtractionException e) { debug("In LF #" + lfi.getLFNum() + ":\n"); debug(e.toString() + "\n"); } } output.close(); debug("\n"); } private void extract(LF flatLF, String fullWords) throws FeatureExtractionException { tex.storeGoldStdPredInfo(fullWords); tex.setLF(flatLF); try { output.write(tex.getAllFeaturesAndAnswer()); } catch (IOException e) { // TODO Auto-generated catch block e.printStackTrace(); } } private void setOutput(BufferedWriter output) { this.output = output; } public static void debug(String string) { if(!quiet) System.err.print(string); } } ================================================ FILE: src/opennlp/ccg/realize/hypertagger/TagExtractor.java ================================================ package opennlp.ccg.realize.hypertagger; import java.io.File; import java.util.*; import opennlp.ccg.hylo.*; import opennlp.ccg.synsem.*; import opennlp.ccg.util.Pair; /** This class contains methods for extracting features from a logical form * * @author espinosa * */ public abstract class TagExtractor { protected class LfGraphLink { String label; // eg. "genrel" String arg; // if applicable LfGraphNode target; // graph node it points to LfGraphNode source; // node it extends from public LfGraphLink(String l, String a, LfGraphNode t) { label = l; arg = a; target = t; } public LfGraphNode getTarget() { return target; } public void setTarget(LfGraphNode t) { target = t; } public String getLabel() { return label; } public LfGraphNode getSource() { return source; } public void setSource(LfGraphNode source) { this.source = source; } } protected class LfGraphNode { String data; String predicateName; int index; // from original LF SatOp pred; // original predicate object ArrayList children; LfGraphLink parentLink; HashMap attribs; protected String POS; // caches the part-of-speech tag for this node (or GS postag) protected String ST; // gold-standard supertag ArrayList> POSList; // not used atm Set> STList; // for 2-pass tags public Set> getSTList() { return STList; } public void setSTList(Set> set) { STList = set; } ArrayList multiparents; FeatureList features; private String id; // e.g. 
"w1" protected FeatureList getFeatures() { return features; } protected void setFeatures(FeatureList features) { this.features = features; } public LfGraphNode(String s, int idx) { data = s; // this is just "w1" or whatever index = idx; children = new ArrayList(); attribs = new HashMap(); POS = null; multiparents = new ArrayList(); } public String getData() { return data; } public void setData(String s) { data = s; } public void addAttribute(String name, String value) { attribs.put(name, value); } public void addChild(LfGraphLink link) { children.add(link); } public ArrayList getChildren() { return children; } public int getNumChildren() { return children.size(); } public boolean isLeafNode() { if(children.isEmpty()) { return true; } else { return false; } } /* public boolean isLexPred() { return HyloHelper.isLexPred(data); }*/ public LfGraphNode findNode(BitSet b) { // intended to be run from the root node; only searches // nodes below this one // Say we want a node whose index is between 1-4 inclusive // pass a bitset with those bits set. Returns the lex pred // node whose index is in the bitset. if(b.get(index)) { return this; } for(LfGraphLink n : children) { n.getTarget().findNode(b); } return null; } public HashMap getAttribs() { return attribs; } public void setAttribs(HashMap attribs) { this.attribs = attribs; } public int getIndex() { return index; } public void setIndex(int index) { this.index = index; } public void setChildren(ArrayList children) { this.children = children; } public String getPredicateName() { return predicateName; } public void setPredicateName(String predicateName) { this.predicateName = predicateName; } public LfGraphLink getParentLink() { return parentLink; } public void setParentLink(LfGraphLink parentLink) { this.parentLink = parentLink; } public void addMultiParent(LfGraphNode parentNode) { // XXX should not be necessary! fix bug & eliminate if(parentNode == this) { return; } this.multiparents.add(parentNode); } public ArrayList getMultiParents() { return this.multiparents; } public SatOp getPred() { return pred; } protected void setPred(SatOp pred) { this.pred = pred; } public String getPOS() { return POS; } public void setPOS(String pos) { POS = new String(pos); } public ArrayList> getPOSList() { return POSList; } public void setPOSList(ArrayList> plist) { this.POSList = plist; } public void setID(String string) { this.id = string; } public String getID() { return this.id; } } public static int LFID = 0; /** Implements a list of features. Keys are short strings, e.g. "CN", "FO", ... * Values are arbitrary strings, but a key can have multiple values. Thus, the values are actually of type ArrayList. 
* @author espinosa * */ protected class FeatureList extends HashMap> { /** * */ private static final long serialVersionUID = 1L; int numFeatures = 0; // deprecated protected void addFeature(String featureName, String value) { /*if(value == null) { return; } if(this.get(featureName) == null) { this.put(featureName.trim(), new ArrayList()); } ArrayList feats = this.get(featureName); feats.add(value.trim()); this.put(featureName.trim(), feats); numFeatures++; */ addFeatureWithProb(featureName, value); } protected void addFeatures(String featureName, ArrayList> values) { for(Pair v : values) { this.addFeatureWithProb(featureName, v.a, v.b ); } } // merge f's features into self /* protected void addFeatures(FeatureList f) { Set>> es = this.entrySet(); for(Map.Entry> e : es) { String fn = e.getKey(); for(String fv : e.getValue()) { this.addFeature(fn, fv); } } } */ protected void addFeatureWithProb(String featureName, String value, Double prob) { if(value == null) { return; } if(this.get(featureName) == null) { this.put(featureName.trim(), new ArrayList()); } ArrayList feats = this.get(featureName); feats.add(value.trim() + ":" + prob.toString()); this.put(featureName.trim(), feats); numFeatures++; } protected void addFeatureWithProb(String featureName, String value) { this.addFeatureWithProb(featureName, value, new Double(1.0)); } protected ArrayList getFeature(String featureName) { return this.get(featureName); } protected String getSingleFeature(String featureName) { return this.get(featureName).get(0); } protected String getAllFeatures() { String output = ""; for(String k : this.keySet()) { for(String v : this.get(k)) { output = output.concat(k + "=" + v); output = output.concat(" "); } } return output; } protected String[] getAllFeaturesForMaxent() { String[] out = new String[this.getNumFeatures()]; int i = 0; for(String k : this.keySet()) { for(String v : this.get(k)) { out[i] = k + "=" + v; i++; } } return out; } protected int getNumFeatures() { return numFeatures; } } // fields protected LfGraphNode lfGraph; // stores the graph structure of the LF protected HashMap nomTable; protected HashMap varTable; protected HashMap lexpairs; protected HashMap pospairs; protected LF lf; protected List preds; protected List flatLF; protected int maxIndex; protected Map argNameMap; // mww: map from arg names to short arg names public TagExtractor() { argNameMap = new HashMap(); } public void setLF(LF lf) throws FeatureExtractionException { LFID++; // experimental HyloHelper.convertNominals(lf); setLF(HyloHelper.getPreds(lf)); } /** This method takes an LF and extracts its features, changing the internal state * of this object accordingly. Other methods such as getSupertag() can then * be called to obtain the tagger's prediction. * @param preds A logical form * @throws FeatureExtractionException when the logical form cannot be processed and the extracted features will not be meaningful */ public void setLF(List preds) throws FeatureExtractionException { this.preds = preds; LfGraphNode curNode = null; curNode = null; nomTable = new HashMap(); varTable = new HashMap(); int i = 0; // Pass 1: find and store nominals for(SatOp s: preds) { if(s == null) { throw new FeatureExtractionException(); // ??? why is it sometimes null? 
} if(s.getArg() instanceof Proposition) { LfGraphNode thisNode = new LfGraphNode(s.getNominal().toString(), i); thisNode.setPredicateName(((Proposition)s.getArg()).getName()); thisNode.setID(s.getNominal().toString()); thisNode.setPred(s); if(lfGraph == null) { // i.e., the first node processed lfGraph = thisNode; } nomTable.put(thisNode.getID(), thisNode); } i++; } this.maxIndex = i; // Pass 2: traverse all other nodes, linking to nominals found in pass 1 i = 0; for(SatOp s: preds) { if(s == null) { throw new FeatureExtractionException(); } if(s.getArg() instanceof Proposition) { curNode = nomTable.get(s.getNominal().toString()); i++; continue; } Diamond d = (Diamond)s.getArg(); // not sure how this could happen, but it did if(d == null || (d.getArg() == null)) { throw new FeatureExtractionException(); } if(d.getArg() instanceof NominalVar) { // XXX all this is probably defunct and can safely be deleted // add multiparent // might need getName() instead of toString() //System.err.println("found var: str = " + d.getArg().toString()); LfGraphNode target = nomTable.get(d.getArg().toString()); LfGraphLink ln = new LfGraphLink(d.getMode().toString(), null, target); ln.setSource(curNode); //target.addMultiParent(ln); } else if(d.getArg() instanceof Nominal) { // make link labeled to nominal LfGraphNode target = nomTable.get(d.getArg().toString()); LfGraphLink ln = new LfGraphLink(d.getMode().toString(), null, target); ln.setSource(curNode); if(target != null) { // ??? why is it sometimes null? and if it is, should an exception be thrown? target.setParentLink(ln); target.addMultiParent(curNode); } else { //System.err.println("TE: target was null: " + d.getArg().toString()); } if(curNode == null) { throw new FeatureExtractionException();} curNode.addChild(ln); } else { // proposition // add attr to current node try { curNode.addAttribute(d.getMode().toString(), d.getArg().toString()); } catch(Exception e) { // ??? this null must occur because there were no attributes, but this // probably isn't the best way to handle it } } // don't change curNode here i++; } } public LF getLF() { return this.lf; } /** This method extracts features from a node in the graph and returns * them as an array of strings. It's implemented slightly differently * in HyperTagger and POSTagExtractor. * @param n The node from which to extract the features. * @return A list of features. */ protected abstract FeatureList getFeatures(LfGraphNode n); /** Get the features for the index'th node * * @param index The index into the LF */ public FeatureList getFeatures(int index) { for(LfGraphNode n : nomTable.values()) { if(n.getIndex() == index) { return getFeatures(n); } } return null; // bad index } // these methods only make sense for training, because // they fetch the gold-standard supertag or POS tag. 
public String getSupertag(LfGraphNode n) { return lexpairs.get(n); } public String getSupertag(int index) { for(LfGraphNode n : nomTable.values()) { if(n.getIndex() == index) { return lexpairs.get(n); } } return null; } public String getPOStag(LfGraphNode n) { return pospairs.get(n); } public String getPOStag(int index) { for(LfGraphNode n : nomTable.values()) { if(n.getIndex() == index) { return pospairs.get(n); } } return null; } // return the node with the given index protected LfGraphNode findNode(int index) { for(LfGraphNode n : nomTable.values()) { if(n.getIndex() == index) { return n; } } return null; } protected int numNodes() { return nomTable.size(); } protected int maxIndex() { return this.maxIndex; } // utility method to do the inverse of java.String.split() public static String join(ArrayList a, String delimiter) { String out = new String(); int i; for(i = 0; i < a.size(); i++) { out = out.concat(a.get(i)); if(i != a.size() - 1) { out = out.concat(delimiter); } } return out; } /** * @param predInfo * @throws FeatureExtractionException * This method stores gold standard predicate info, which is expected to be in the following format: * predInfo :: (field)+ * field :: wordId:supertag:POStag:predName * * The supertag and postag are expected to have been escaped by Lexicon.DefaultTokenizer.escape(), and will be unescaped during storage. * This method throws a runtime error if the predInfo string cannot be parsed. * */ public abstract void storeGoldStdPredInfo(String predInfo); public abstract String getAllFeaturesAndAnswer(); public abstract void loadPriorModel(File priorModelFile, File vocabFile); public void loadProtoModel(File hyperModelFile) { // TODO refactor TagExtract app so this isn't needed return; } // mww: sets configurable arg names /** * Sets the arg name map to the given names. * @param argnames Space-delimited arg names in format name(:shortname)?. * Defaults to "Arg0:A0 Arg1:A1 Arg1a:A1a Arg1b:A1b Arg2:A2 Arg2a:A2a Arg2b:A2b Arg3:A3 Arg4:A4 Arg5:A5". 
*/ protected void setArgNames(String argnames) { argNameMap.clear(); // default is augmented propbank arg names if (argnames == null) argnames = "Arg0:A0 Arg1:A1 Arg1a:A1a Arg1b:A1b Arg2:A2 Arg2a:A2a Arg2b:A2b Arg3:A3 Arg4:A4 Arg5:A5"; String[] nameslist = argnames.split("\\s+"); for (String argname : nameslist) { String[] namepair = argname.split(":"); if (namepair.length == 2) argNameMap.put(namepair[0], namepair[1]); else if (namepair.length == 1) argNameMap.put(namepair[0], namepair[0]); } } } ================================================ FILE: src/opennlp/ccg/realize/hypertagger/ZLMaxentHypertagger.java ================================================ package opennlp.ccg.realize.hypertagger; import static java.util.Arrays.asList; import java.io.BufferedWriter; import java.io.File; import java.io.FileWriter; import java.io.IOException; import java.io.OutputStreamWriter; import java.util.ArrayList; import java.util.Collection; import java.util.Collections; import java.util.HashMap; import java.util.HashSet; import java.util.List; import java.util.Map; import java.util.Set; import java.util.logging.Level; import java.util.logging.Logger; import java.util.regex.Matcher; import java.util.regex.Pattern; import joptsimple.OptionParser; import joptsimple.OptionSet; import joptsimple.OptionSpec; import opennlp.ccg.hylo.Nominal; import opennlp.ccg.hylo.SatOp; import opennlp.ccg.lexicon.DefaultTokenizer; import opennlp.ccg.lexicon.Word; import opennlp.ccg.parse.supertagger.io.XMLPOSDictionaryReader; import opennlp.ccg.parse.supertagger.io.XMLWordDictionaryReader; import opennlp.ccg.parse.supertagger.ml.STPriorModel; import opennlp.ccg.parse.supertagger.util.STTaggerPOSDictionary; import opennlp.ccg.parse.supertagger.util.STTaggerWordDictionary; import opennlp.ccg.parse.tagger.util.ConfigFileProcessor; import opennlp.ccg.parse.tagger.util.ResultSink; import opennlp.ccg.realize.Hypertagger; import opennlp.ccg.util.Pair; /** * * @author espinosa * This class implements the hypertagger. Instantiating a hypertagger requires several external * files: *
    * 1. A POS model
    * 2. A prior model for POS tags, and its vocab file
    * 3. A prior model for hypertags, and its vocab file
    * The prior model files are optional.
    * To use the hypertagger for realization, instantiate a POS tagger first, then * instantiate the hypertagger using that POS tagger. Example in pseudo-code: * * POSPriorModel ppm = new POSPriorModel(String flmFile, String vocabFile); * ZLMaxentModel posMod = new ZLMaxentModel(String fileName); * ZLPOSTagger pt = new ZLPOSTagger(posMod, ppm); * ZLMaxentHypertagger ht = new ZLMaxentHypertagger(pt, File htModelPath); * ht.loadPriorModel(File priorModelFile, File vocabFile); * * The tagger can also be instantiated from a config file. This is the recommended * method for using the tagger as part of the realizer. See the method 'ZLMaxentHypertaggerFactory'. * * */ public class ZLMaxentHypertagger extends TagExtractor implements Hypertagger { File hypertagModelFilename; File posModelFilename; public ZLMaxentModel hypertagModel; // null if extracting feats for training ZLMaxentModel posModel; // null if extracting feats for training ZLPOSTagger postagger; ZLMaxentModel protoHTModel; double protoHTBeta = 0.01; // FIXME what should this be? LfGraphNode currentPred; String LFNum; protected double[] betas; int currentBeta; //Flag which indicates whether gold std tags need to be ensured during tag prediction //Gold std tag info for perceptron training (event generation) private boolean goldStdTagInsert=false; //Nominal id to gold std supertag mapping private HashMap goldPred2Tag; private STPriorModel priorModel; double priorBeta = 0.4; private HashMap goldPredPOS; private STTaggerWordDictionary wdict; // word (pred)-level tagging dictionary private STTaggerPOSDictionary posdict; // pos-level tagging dictionary int dictK; // frequency threshold for tagdict lookups public BufferedWriter tdErr; public class ProbIndexPair implements Comparable { public double prob; public int index; public ProbIndexPair(double prob, int index) { this.prob = prob; this.index = index; } public int compareTo(Object o) { if(prob < ((ProbIndexPair)o).prob) { return -1; } else if(prob == ((ProbIndexPair)o).prob) { return 0; } else { return 1; } } } /** * @author espinosa * This is a singleton class containing functions for extracting various features * from the LF graph nodes. These * feature functions are called from ZLMaxentHypertagger#getFeatures. * * Some of the functions extract several features at once, to avoid unnecessary iteration. * Feature template abbreviations: * * FO -- fan-out, i.e. number of children * PN -- predicate name * RN -- parent name * CT -- type of child * A1N, A2N, ... -- Arg1 name, Arg2 name, ... (by default) * A1P, A2P, ... -- Arg1 POS tag, Arg2 POS tag, ... 
(by default) * MP -- Modifier POS tag (non-arg children) * PP -- parent's POS tag, if any parent * CN -- name of child * NA -- number of Argument children * PT -- POS tag (see docs) * ZD -- det=value * ZM -- mood=value * ZN -- num=value * ZT -- tense=value * ZP -- partic=value * XC -- semantic class of node, if applicable * XnD -- semantic class of argument child node n, if applicable (by default) * XP -- semantic class of parent node, if applicable * XM -- semantic class of non-arg child node, if applicable * CS -- child supertag * PS -- parent supertag * AS -- argument supertag * MS -- modifier supertag * */ // mww: switched to configurable arg names void fillFeatures(LfGraphNode n, FeatureList f) { f.addFeatureWithProb("FO", Integer.toString(n.getNumChildren())); for(String att : n.getAttribs().keySet()) { f.addFeatureWithProb("Z" + att.substring(0,1).toUpperCase(), n.getAttribs().get(att)); } f.addFeatureWithProb("PN", n.getPredicateName()); if(n.getMultiParents().size() > 0) { for(LfGraphNode parent : n.getMultiParents() ) { f.addFeatureWithProb("RN", parent.getPredicateName()); /* the line below will add the parent's best-ranked POS tag with prob=1.0 */ f.addFeatureWithProb("PP", getPOS(parent)); /* The code below will add the parent's best-ranked POS tag with its actual probability */ /* ArrayList> poslist = getBetaBestPOS(parent); Pair pospair = poslist.get(0); feats.addFeatureWithProb("PP", pospair.a, pospair.b); */ // add class name, if available String cls = parent.getPred().getNominal().toString(); // string is in X:Y:Z format. Remove 'X:' leaving 'Y:Z'. if(cls != null && cls.indexOf(':') > 0) { String cfeat = cls.substring(cls.indexOf(':') + 1); f.addFeatureWithProb("XP", cfeat); } } } else { f.addFeatureWithProb("RN", "0"); } int argchildren = 0; for(LfGraphLink lnk : n.getChildren()) { f.addFeatureWithProb("CT", lnk.getLabel()); if(lnk.getTarget() != null) { // how could it be null? f.addFeatureWithProb("CN", lnk.getTarget().getPredicateName()); // mww: use short arg name String shortArgName = argNameMap.get(lnk.getLabel()); if (shortArgName != null) { // increment argchild count argchildren++; f.addFeatureWithProb(shortArgName + "N", lnk.getTarget().getPredicateName()); f.addFeatureWithProb(shortArgName + "P", getPOS(lnk.getTarget()) ); // add class info for arg child, if applicable String cls = lnk.getTarget().getPred().getNominal().toString(); // string is in X:Y:Z format. Remove 'X:' leaving 'Y:Z'. if(cls != null && cls.indexOf(':') > 0) { String cfeat = cls.substring(cls.indexOf(':') + 1); // mww: for backwards compatibility String argNumOrName = (shortArgName.startsWith("A")) ? shortArgName.substring(1) : shortArgName; f.addFeatureWithProb("X" + argNumOrName + "D", cfeat); } } else { // not an argument child f.addFeatureWithProb("MP", getPOS(lnk.getTarget())); // add class info for non-arg child, if applicable String cls = lnk.getTarget().getPred().getNominal().toString(); // string is in X:Y:Z format. Remove 'X:' leaving 'Y:Z'. 
if(cls != null && cls.indexOf(':') > 0) { String cfeat = cls.substring(cls.indexOf(':') + 1); f.addFeatureWithProb("XM", cfeat); } } } } f.addFeatureWithProb("NA", Integer.toString(argchildren)); if(posModel == null) { f.addFeatureWithProb("PT", getPOS(n)); } else { ArrayList> poslist = getBetaBestPOS(n); for(Pair pospair : poslist) { // add PT=NNP:0.7, PT=NN:0.6, etc f.addFeatureWithProb("PT", pospair.a, pospair.b); n.setPOS(pospair.a); // take the top choice to be "the pos tag", used later for prior } } // class name feature for node, if available Nominal idx = n.getPred().getNominal(); String cls = idx.toString(); // string is in X:Y:Z format. Remove 'X:' leaving 'Y:Z'. if(cls != null && cls.indexOf(':') > 0) { String cfeat = cls.substring(cls.indexOf(':') + 1); f.addFeatureWithProb("XC", cfeat); } // prior features if(priorModel != null) { Word w = Word.createWord(n.getPredicateName(), null, null, n.getPredicateName(), getPOS(n), null, null); priorModel.computePriors(w); List> tags = priorModel.getBetaBestPriors(w, priorBeta); for(Pair t : tags) { f.addFeatureWithProb("PR_ST", DefaultTokenizer.unescape(t.a), t.b); } } } private void fillTwoPassFeatures(LfGraphNode n, FeatureList f) { // get the STs from the STList for(Pair p : n.getSTList()) { f.addFeatureWithProb("ST", p.a, p.b); } // get parent STs for(LfGraphNode pl : n.getMultiParents()) { for(Pair p : pl.getSTList()) { f.addFeatureWithProb("STP", p.a, p.b); } } for(LfGraphLink cl : n.getChildren()) { /* for(Pair p : cl.getTarget().getSTList()) { */ LfGraphNode c = cl.getTarget(); if(c != null) { for(Pair p : c.getSTList()) { f.addFeatureWithProb("STC", p.a, p.b); } } } } public ZLMaxentHypertagger() { super(); betas = new double[7]; // values determined by DNM 20 April 2008). betas[0] = 0.16; betas[1] = 0.05; betas[2] = 0.0058; betas[3] = 0.00175; betas[4] = 0.000625; betas[5] = 0.000125; betas[6] = 0.000058; currentBeta = 0; goldPred2Tag = new HashMap(); goldPredPOS = new HashMap(); } /** This constructor loads both a POS-tagging model and a hypertagging model. * * @param posModelFile The filename from which to load the POS-tagging model. If null, * gold-stardard POS tags will be used (and must be stored via storeGoldStdPredInfo()). * @param hyperModelFile The filename from which to load the hypertagging model * @throws IOException If any model fails to load. */ public ZLMaxentHypertagger(File posModelFile, File hyperModelFile) throws IOException { this(); this.posModelFilename = posModelFile; // load the models if(posModelFile != null) { this.posModel = new ZLMaxentModel(); this.posModel.load(posModelFile); this.postagger = new ZLPOSTagger(posModel); postagger.setPrefixLength(4); postagger.setSuffixLength(4); postagger.argNameMap = this.argNameMap; // share the arg name map } this.hypertagModelFilename = hyperModelFile; this.hypertagModel = new ZLMaxentModel(); this.hypertagModel.load(hyperModelFile); } /* POS tagger can be null. In that case, gold-standard POS tags will be used. 
* To use in "realization mode", do the following: * 1) instantiate a ZLPOSTagger as normal * 2) load the POS prior model into the POS tagger * 3) Instantiate the ZLMaxentHypertagger with this constructor, passing the POS tagger * and the path to the trained hypertagging model file * 4) load the ht-prior model into the ZLMaxentHypertagger using setPriorModel(vocab, priorfile) * 5) commence tagging via setLF() and getSupertags() */ public ZLMaxentHypertagger(ZLPOSTagger ptag, File hyperModelFile) { this(); this.postagger = ptag; this.postagger.argNameMap = this.argNameMap; // share the arg name map this.hypertagModelFilename = hyperModelFile; this.hypertagModel = new ZLMaxentModel(); this.hypertagModel.load(hyperModelFile); } /** This constructor loads only a POS-tagging model. It's useful for extracting features for Maxent training. * * @param posModelFile The filename from which to load the model. * @throws IOException If the model couldn't be loaded for any reason. */ public ZLMaxentHypertagger(File posModelFile) throws IOException { this(); this.posModelFilename = posModelFile; // load the model this.posModel = new ZLMaxentModel(); this.posModel.load(posModelFile); this.postagger = new ZLPOSTagger(posModel); postagger.setPrefixLength(4); postagger.setSuffixLength(4); postagger.argNameMap = this.argNameMap; // share the arg name map } public static ZLMaxentHypertagger ZLMaxentHypertaggerFactory(String configFile) throws IOException { ZLMaxentHypertagger hypertagger = new ZLMaxentHypertagger(); ZLPOSTagger postagger = null; String[] pathKeys = { "priormodel", "priormodelvocab", "wdict", "posdict", "maxentmodel", "posconfig" }; Map opts = ConfigFileProcessor.readInConfig(configFile, pathKeys); // load the POS model first String posConfig = opts.get("posconfig"); if(posConfig != null) { postagger = ZLPOSTagger.ZLPOSTaggerFactory(posConfig); } hypertagger.postagger = postagger; // now load the prior models and/or tag dicts // if prior models are specified, then tagdicts are not used, or even loaded String priorModelPath = opts.get("priormodel"); String wdictPath = opts.get("wdict"); if(priorModelPath != null) { String vocabPath = opts.get("priormodelvocab"); if(vocabPath == null) { throw new IOException("You must specify a vocab filename along with the prior model filename."); } hypertagger.loadPriorModel(new File(priorModelPath), new File(vocabPath)); } else if(wdictPath != null) { String posdictPath = opts.get("posdict"); if(posdictPath == null) { throw new IOException("You must specify both a word-level dict and a POS dict."); } XMLWordDictionaryReader wdr = new XMLWordDictionaryReader(new File(wdictPath)); XMLPOSDictionaryReader pdr = new XMLPOSDictionaryReader(new File(posdictPath)); STTaggerWordDictionary wdict = wdr.read(); STTaggerPOSDictionary posdict = pdr.read(); hypertagger.wdict = wdict; hypertagger.posdict = posdict; String kstring = opts.get("dictk"); if(kstring != null) hypertagger.dictK = Integer.parseInt(kstring); } String maxentModelPath = opts.get("maxentmodel"); if(maxentModelPath == null) { System.err.println("Maxent model path must be specified with key \"maxentmodel\"."); throw new IOException(); } String protoHTModelPath = opts.get("protomodel"); // process betas String betaString = opts.get("betas"); if(betaString != null) { String[] bs = betaString.split("\\s+"); double[] betaVals = new double[bs.length]; int i; for(i = 0; i < bs.length; i++) { betaVals[i] = Double.parseDouble(bs[i]); } // can't sort descending w/o extra code and vars? 
// for now, assume betas are in correct order in configfile //Arrays.sort(betaVals); hypertagger.betas = betaVals; } hypertagger.hypertagModel = new ZLMaxentModel(maxentModelPath); if(protoHTModelPath != null) { hypertagger.protoHTModel = new ZLMaxentModel(protoHTModelPath); System.err.println("Two-pass model instantiated. Initializing hyperdrive."); } // mww: add argnames String argnames = opts.get("argnames"); hypertagger.setArgNames(argnames); return hypertagger; } private String getPOS(LfGraphNode n) { if(postagger == null) { // use gold-standard POS tag String posTag = goldPredPOS.get(n.getPred().getNominal().getName()); if(posTag == null) { // XXX this is not correct posTag = "UNK"; } return posTag; } // else use POS model to get beta-best POS if(n.getPOS() == null) { FeatureList feats = postagger.getFeatures(n); //String pos = new String(postagger.getBestPOS(feats)); // POS tags for nodes are cached in the node itself // so as to avoid repeated calls to the model for the same node ArrayList> pos = postagger.getBetaBestPOS(feats); n.setPOS(pos.get(0).a); } return n.getPOS(); } private String getGoldSupertag(LfGraphNode n) { return goldPred2Tag.get(n.getPred().getNominal().getName()); } private ArrayList> getBetaBestPOS(LfGraphNode n) { // TODO (for training): add gold-standard POS tag, if it is not in the beta-best // list. Or should we use beta-best POS tags in training at all? if(n.getPOSList() == null) { FeatureList feats = postagger.getFeatures(n); ArrayList> pos = null; //String pos = new String(postagger.getBestPOS(feats)); pos = postagger.getBetaBestPOS(feats); n.setPOSList(pos); } return n.getPOSList(); } // computes all features for the graph node, returns a feature list protected FeatureList getFeatures(LfGraphNode n) { FeatureList feats; feats = n.getFeatures(); if(feats != null) { return feats; } feats = new FeatureList(); fillFeatures(n, feats); return feats; } /** Get all features for the current LF as a single multi-line string. * Used during extraction of training data. * @return All features for the current LF. */ public String getAllFeaturesAndAnswer() { StringBuilder output = new StringBuilder(); for(LfGraphNode n : nomTable.values()) { FeatureList feats = getFeatures(n); String context = feats.getAllFeatures(); //String tag = n.getPred().getOrigin().getSupertag(); String tag = goldPred2Tag.get(n.getPred().getNominal().getName()); output = output.append(tag + " " + context); output = output.append("\n"); } return output.toString(); } // for every node in the tree, compute its features, and store them inside the nodes private void assignAllFeatures() { for(LfGraphNode n : nomTable.values()) { FeatureList feats = getFeatures(n); n.setFeatures(feats); // eval the proto-model, set the node's STList to the returned outcomes/probs if(protoHTModel != null) { n.setSTList(getProtoSupertagsAndProbs(n, protoHTBeta)); } } // now traverse the graph again, calculating the additional STS features, // then unioning that feature list with the cached one if(protoHTModel != null) { for(LfGraphNode n : nomTable.values()) { FeatureList feats = getFeatures(n); // feats guaranteed cached by first pass fillTwoPassFeatures(n, feats); n.setFeatures(feats); // necessary? 
} } } public ZLMaxentModel getPosModel() { return posModel; } public File getPosModelFilename() { return posModelFilename; } public void setLF(List preds) throws FeatureExtractionException { super.setLF(preds); if(postagger != null) { postagger.setLF(preds); } assignAllFeatures(); } public String getLFNum() { return this.LFNum; } public void setLFNum(String s) { this.LFNum = s; } /** Set the POS tagging model to use. * @param posModelFilename The filename containing the LBFGS model to use for * computing simple POS tags as part of the featureset. * @throws IOException when the model cannot be loaded for some reason. */ public void setPOSModelFilename(File posModelFilename) throws IOException { this.posModelFilename = posModelFilename; // load the model this.posModel = new ZLMaxentModel(); this.posModel.load(posModelFilename); this.postagger = new ZLPOSTagger(posModel); } public File getHypertagModelFilename() { return hypertagModelFilename; } /** Set the POS tagging model to use. * @param posModelFilename The filename containing the LBFGS model to use for * computing simple POS tags as part of the featureset. * @throws IOException when the model cannot be loaded for some reason. */ public void setHypertagModelFilename(File hypertagModelFilename) throws IOException { this.hypertagModelFilename = hypertagModelFilename; // load the model this.hypertagModel = new ZLMaxentModel(); this.hypertagModel.load(hypertagModelFilename); } /* methods from Hypertagger interface */ // should probably just rename setLF to mapPreds in the first place public void mapPreds(List preds) { try { setLF(preds); } catch(FeatureExtractionException e) { throw (RuntimeException) new RuntimeException().initCause(e); } } public void setPred(int index) { currentPred = findNode(index); } public void resetBeta() { currentBeta = 0; } public void resetBetaToMax() { currentBeta = betas.length - 1; } public void nextBeta() { if(currentBeta < betas.length -1) { currentBeta++; } } public void previousBeta() { if(currentBeta > 0) { currentBeta--; } } public boolean hasMoreBetas() { if(currentBeta < betas.length - 1) { return true; } return false; } public boolean hasLessBetas() { if(currentBeta > 0 && this.hasMoreBetas()) { return true; } return false; } public Map getSupertags() { Set> tp = this.getSupertagsAndProbs(this.currentPred, this.betas[this.currentBeta]); if(tp == null) { return null; } HashMap tagMap = new HashMap(tp.size()); for(Pair p : tp) { tagMap.put(p.a, p.b); } return tagMap; } /* this method is for use with the ResultSink class, during testing. That code requires the elements of the pairs to be swapped. 
*/ private List> getSupertagsAsList() { Set> tp = this.getSupertagsAndProbs(this.currentPred, this.betas[this.currentBeta]); ArrayList> ret = new ArrayList>(); for(Pair p : tp) { ret.add(new Pair(p.b,p.a)); } return ret; } // cannot be made static due to ProbIndexPair private ArrayList getModelOutcomes(FeatureList f, ZLMaxentModel m) { ArrayList probList = new ArrayList(); double[] probs = m.eval(f.getAllFeaturesForMaxent(),true); for(int i = 0; i < probs.length; i++) { probList.add(new ProbIndexPair(probs[i], i)); } Collections.sort(probList); Collections.reverse(probList); return probList; } private HashSet> betaSearch(ArrayList probList, double beta) { double maxProb = probList.get(0).prob; HashSet> names = new HashSet>(); for(int i = 0; i < probList.size(); i++) { if(probList.get(i).prob >= beta * maxProb) { names.add(new Pair(protoHTModel.getOutcome(probList.get(i).index), probList.get(i).prob)); } else { break; } } return names; } public Set> getProtoSupertagsAndProbs(LfGraphNode n, double beta) { HashSet> names; ArrayList probList = new ArrayList(); probList = getModelOutcomes(n.getFeatures(), protoHTModel); names = betaSearch(probList, beta); return names; } /* 'MAIN' hypertagging entry point */ @SuppressWarnings("boxing") public Set> getSupertagsAndProbs(LfGraphNode n, double beta) { if(currentPred == null) { return null; // not handling EPs for rels or feats, so return null } double bestOCProb = 0.0, curOCProb = 0.0; HashSet> names = new HashSet>(); HashSet tagList = new HashSet(); ArrayList probList = new ArrayList(); probList = getModelOutcomes(n.getFeatures(), hypertagModel); /* check tagdict */ if(wdict != null) { // get pred name, get tags from dict at K, if none, try pos dict String predName = n.getPredicateName(); Collection permittedOutcomes = wdict.getEntry(predName, this.dictK); if(permittedOutcomes == null) { // back off to POS dict String pos = getPOS(n); permittedOutcomes = posdict.getEntry(pos); // sanity check if(permittedOutcomes == null) { System.err.println("!! No pos dict entries for " + pos); } } ArrayList po = new ArrayList(); for(String s : permittedOutcomes) { po.add(DefaultTokenizer.unescape(s)); } permittedOutcomes = (Collection)po; if(permittedOutcomes != null) { String oc = ""; for(ProbIndexPair p : probList) { oc = hypertagModel.getOutcome(p.index); curOCProb = p.prob; if(permittedOutcomes.contains(oc)) { if (bestOCProb == 0) { bestOCProb = curOCProb; } if (curOCProb >= (bestOCProb * beta)) { // Beta constraint. // The cut-off was met, add the outcome. names.add(new Pair(oc, p.prob)); tagList.add(oc); // update max, for first selected outcome if (curOCProb > bestOCProb) { bestOCProb = curOCProb; } } else { // Else, since our ProbIndexPair[] is sorted by probablity, there will be no more // outcomes that make the (beta) cut. break; } } else { // the outcome was ruled out by the tagdict. make a note of it. 
String nomId = currentPred.pred.getNominal().getName(); String gsTag = ""; String gsPos = ""; if(goldPred2Tag.containsKey(nomId)) { gsTag = goldPred2Tag.get(nomId); gsPos = goldPredPOS.get(nomId); } if(gsTag.equals(oc)) { try { tdErr.write(predName + "\t" + currentPred.index + "\t" + LFNum + "\t" + gsTag + "\t" + gsPos + "\n"); tdErr.flush(); } catch(Exception e) { throw new RuntimeException(e); } } } } } } else { // not using dicts double maxProb = probList.get(0).prob; for(int i = 0; i < probList.size(); i++) { if(probList.get(i).prob >= beta * maxProb) { names.add(new Pair(hypertagModel.getOutcome(probList.get(i).index), probList.get(i).prob)); tagList.add(hypertagModel.getOutcome(probList.get(i).index)); } else { break; } } } String nomId=currentPred.pred.getNominal().getName(); if(goldPred2Tag.containsKey(nomId)){ String goldStdTag=goldPred2Tag.get(nomId); if(goldStdTagInsert && !tagList.contains(goldStdTag)) names.add(new Pair(goldStdTag,1.0)); } return names; } public double getCurrentBetaValue() { if(currentBeta "); for(LfGraphNode n : nomTable.values()) { if(goldPred2Tag.get(n.getPred().getNominal().getName()) == null) { continue; // skip has-rel for now } out.append(DefaultTokenizer.escape(n.getPredicateName())); out.append(":S-"); out.append(DefaultTokenizer.escape(n.getPredicateName())); out.append(":P-"); out.append(DefaultTokenizer.escape(getPOS(n))); out.append(":T-"); out.append(DefaultTokenizer.escape(goldPred2Tag.get(n.getPred().getNominal().getName()))); out.append(" "); } out.append("\n"); return out.toString(); } public Word getPredAsWord(int idx) { LfGraphNode n = findNode(idx); Word w = Word.createWord(n.getPredicateName(), null, null, n.getPredicateName(), getPOS(n), getGoldSupertag(n), null); return w; } private Word getPredAsWord() { Word w = Word.createWord(currentPred.getPredicateName(), null, null, currentPred.getPredicateName(), getPOS(currentPred), getGoldSupertag(currentPred), null); return w; } @SuppressWarnings("boxing") public static void main(String[] args) throws IOException { String usage = "\nhypertagger (-i ) (-o [defaults to ]) (-c )\n"; if (args.length > 0 && args[0].equals("-h")) { System.out.println(usage); System.exit(0); } OptionParser o = new OptionParser(); o.acceptsAll(asList("help", "h"), "this message"); o.acceptsAll(asList("quiet", "q"), "print no status messages"); OptionSpec b_s = o.acceptsAll(asList("beta", "b"), "ignore betas in config file and use this value").withRequiredArg().ofType(Double.class); OptionSpec gr_s = o.acceptsAll(asList("g", "grammar")).withRequiredArg().ofType(File.class).describedAs("grammar filename"); OptionSpec corpusDir_s = o.acceptsAll(asList("d", "lf-dir")).withRequiredArg().ofType(File.class).describedAs("Directory to change to before searching for XML files"); OptionSpec configFile_s = o.acceptsAll(asList("c", "config")).withRequiredArg().ofType(File.class).describedAs("configfilename"); OptionSpec output_s = o.acceptsAll(asList("o", "output")).withRequiredArg().ofType(File.class).describedAs("output filename"); OptionSpec dump_s = o.acceptsAll(asList("dump-tags", "T")).withRequiredArg().ofType(File.class).describedAs("dump predicted tags to file"); o.acceptsAll(asList("goldstd", "G"), "include gold-standard supertags in tag dump"); OptionSet options = o.parse(args); File outputF = options.valueOf(output_s); File dumpF = options.valueOf(dump_s); File configFile = options.valueOf(configFile_s); BufferedWriter out = null; BufferedWriter dump = null; ArrayList resBetas; boolean quiet = options.has("q"); int 
lfcount = 0; try { out = (output_s.equals("stdout")) ? new BufferedWriter(new OutputStreamWriter(System.out)) : new BufferedWriter(new FileWriter(outputF)); } catch (IOException ex) { System.err.print("Output file " + outputF + " could not be opened. Exiting..."); Logger.getLogger(STPriorModel.class.getName()).log(Level.SEVERE, null, ex); System.exit(1); } ZLMaxentHypertagger ht = ZLMaxentHypertagger.ZLMaxentHypertaggerFactory(configFile.getAbsolutePath()); if(options.has("T")) { try { dump = new BufferedWriter(new FileWriter(dumpF)); } catch(IOException e) { System.err.print("Output file " + dumpF + " could not be opened. Exiting..."); System.exit(1); } } if(options.has("b")) { double beta = options.valueOf(b_s); ht.betas = new double[1]; ht.betas[0] = beta; } resBetas = new ArrayList(ht.betas.length); for(int i = 0; i < ht.betas.length; i++) { ResultSink r = new ResultSink(); resBetas.add(r); } ArrayList errFiles = new ArrayList(); for(int i = 0; i < ht.betas.length; i++) { File logdir = new File("logs"); if (!logdir.exists()) logdir.mkdirs(); BufferedWriter b = new BufferedWriter(new FileWriter(new File("logs/tagdict.err.out." + i))); b.write("### beta = " + ht.betas[i] + "\n"); errFiles.add(b); } LFLoader lfs = new LFLoader(options.valueOf(gr_s), options.valueOf(corpusDir_s), options.nonOptionArguments()); while(lfs.hasNext()) { lfcount++; LFInfo lfi = lfs.next(); try { ht.setLF(lfi.getLF()); ht.storeGoldStdPredInfo(lfi.getFullWords()); ht.setLFNum(lfi.getLFNum()); } catch (FeatureExtractionException e) { e.printStackTrace(); } List>> lfTagging = new ArrayList>>(); List gsTagging = new ArrayList(); List> tags; Word w; for(int bi = 0; bi < ht.betas.length; bi++) { gsTagging = new ArrayList(); lfTagging = new ArrayList>>(); ht.setBetaIndex(bi); ht.tdErr = errFiles.get(bi); for(int i = 0; i < ht.maxIndex(); i++) { ht.setPred(i); if(ht.currentPred == null) { //System.err.println("Skipping null pred " + i); continue; } w = ht.getPredAsWord(); tags = ht.getSupertagsAsList(); lfTagging.add(tags); gsTagging.add(w); if(dump != null) { if(options.has("G") && w.getSupertag() != null) { dump.write(w.getSupertag() + " "); } dump.write(w.getForm() + " "); for(int j = 0; j < tags.size(); j++) { dump.write(tags.get(j).a + " " + tags.get(j).b + " "); } dump.write("\n"); } } resBetas.get(bi).addSent(lfTagging, gsTagging); if(!quiet) { System.err.println("LFs processed: " + lfcount + "\r"); } ht.tdErr.flush(); } } if(dump != null) { dump.flush(); dump.close(); } for(int i = 0; i < ht.betas.length; i++) { errFiles.get(i).close(); } for(int i = 0; i < ht.betas.length; i++) { out.write("---------------\n"); out.write("BETA: " + ht.betas[i] + "\n"); out.write(resBetas.get(i).report()); } out.flush(); out.close(); } private void setBetaIndex(int bi) { this.currentBeta = bi; } } ================================================ FILE: src/opennlp/ccg/realize/hypertagger/ZLMaxentModel.java ================================================ package opennlp.ccg.realize.hypertagger; import java.io.BufferedReader; import java.io.File; import java.io.FileNotFoundException; import java.io.FileReader; import java.io.IOException; import java.util.ArrayList; import java.util.HashMap; import java.util.Map; public class ZLMaxentModel { private MyIntegerPool intPool = new MyIntegerPool(50000); private double doubMax = 1.79769E+308; private ItemMap predMap = new ItemMap(this.intPool); private ItemMap outComeMap = new ItemMap(this.intPool); private Map>> params = new HashMap>>(); private boolean loaded = false; private double[] 
probs; private int n_outcome; public ZLMaxentModel() { } public ZLMaxentModel(String modelFilename) { this.load(new File(modelFilename)); } public void load(File modelFile) { if(!this.loaded) { this.loaded = true; BufferedReader br = null; try { br = new BufferedReader(new FileReader(modelFile)); String line = br.readLine(); if(line.contains("#")) { //DEBUG: outf.write(line+"\n"); line = br.readLine(); } // Read in contextual predicates. int numPreds = Integer.parseInt(line.trim()); for(int i=0; i>> tempParamsMap = new ArrayList>>(); int numParameters = this.predMap.size(); ArrayList> prms; int fid = 0; String ln = ""; for(int q=0; q>(); Integer oid; for(int p=1; p(oid, this.intPool.getInt(fid))); fid++; } tempParamsMap.add(prms); } // Load theta. int nTheta = Integer.parseInt(br.readLine().trim()); double[] theta = new double[nTheta]; for(int z=0; z> tmpParamsList; int index = 0; for(ArrayList> param : tempParamsMap) { tmpParamsList = new ArrayList>(); for(ZPair mapping : param) { //System.out.print(mapping.b.intValue()+" "); tmpParamsList.add(new ZPair(mapping.a, new Double(theta[mapping.b.intValue()]))); } this.params.put(this.intPool.getInt(index), tmpParamsList); index++; } this.n_outcome = this.outComeMap.size(); this.probs = new double[this.n_outcome]; // Initialise the array for computing distribution over all labels. } catch (FileNotFoundException e) { e.printStackTrace(); } catch (IOException e) { e.printStackTrace(); } finally { try { br.close(); } catch(IOException ioe) { ioe.printStackTrace(); } } } } public String getBestOutcome(double[] probs) { double maxprob = 0.0; int maxidx = -1; for(int i = 0; i < probs.length; i++) { if(probs[i] > maxprob) { maxidx = i; maxprob = probs[i]; } } return getOutcome(maxidx); } @SuppressWarnings("boxing") public double[] eval(String[] context, boolean realValued) { // Zero out prob distribution over labels. for(int i=0; i> pred_value = new ArrayList>(context.length); Double one = new Double(1.0); // Split up the strings into (pred,double) pairs. 
int splitPoint; for(int m=0; m(context[m].substring(0, splitPoint), Double.parseDouble(context[m].substring(splitPoint+1, context[m].length()))) ); } else { pred_value.add( new ZPair(context[m], one) ); } } ArrayList> featureWeights; //for(int j=0; j pv : pred_value) { Integer predID = this.predMap.id(pv.a); if(predID!=null) { featureWeights = this.params.get(predID); for(ZPair fw : featureWeights) { this.probs[fw.a.intValue()] += (fw.b.doubleValue() * pv.b.doubleValue()); } } } double sum = 0.0; for(int p=0; p dict = new HashMap(); private Map reverseDict = new HashMap(); private MyIntegerPool intPool; public ItemMap(MyIntegerPool intPool) { this.intPool = intPool; this.index = intPool.getInt(0); } @SuppressWarnings("boxing") public int add(String item) { if(this.dict.containsKey(item)) { return this.dict.get(item); } else { this.dict.put(item, index); this.reverseDict.put(index, item); this.index = this.intPool.getInt(index.intValue() + 1); return index.intValue()-1; } } public Integer id(String item) { if(this.dict.containsKey(item)) { return this.dict.get(item); } else { return null; } } public int size() { return this.dict.size(); } public String getItem(int i) { return this.reverseDict.get(this.intPool.getInt(i)); } } class ZPair { public A a; public B b; public ZPair(A a, B b) { this.a = a; this.b = b; } } class MyIntegerPool { private Integer[] _table; public MyIntegerPool(int size) { this._table = new Integer[size]; for(int i=0; i= 0) { return this._table[i]; } else { return new Integer(i); } } } ================================================ FILE: src/opennlp/ccg/realize/hypertagger/ZLPOSTagger.java ================================================ package opennlp.ccg.realize.hypertagger; import java.io.BufferedReader; import java.io.BufferedWriter; import java.io.File; import java.io.FileNotFoundException; import java.io.FileReader; import java.io.FileWriter; import java.io.IOException; import java.io.OutputStreamWriter; import java.util.ArrayList; import java.util.Collections; import java.util.HashMap; import java.util.List; import java.util.Map; import java.util.logging.Level; import java.util.logging.Logger; import java.util.regex.Matcher; import java.util.regex.Pattern; import opennlp.ccg.hylo.Nominal; import opennlp.ccg.lexicon.DefaultTokenizer; import opennlp.ccg.parse.postagger.ml.POSPriorModel; import opennlp.ccg.parse.tagger.util.ConfigFileProcessor; import opennlp.ccg.parse.tagger.util.ResultSink; import opennlp.ccg.util.Pair; public class ZLPOSTagger extends TagExtractor { ZLMaxentModel model; POSPriorModel priorModel; int prefixLength = 4; int suffixLength = 4; double beta = 0.35; private HashMap goldPred2Tag=new HashMap(); public class ProbIndexPair implements Comparable { public double prob; public int index; public ProbIndexPair(double prob, int index) { this.prob = prob; this.index = index; } public int compareTo(ProbIndexPair o) { if(prob < o.prob) { return -1; } else if(prob == o.prob) { return 0; } else { return 1; } } } public ZLPOSTagger() { super(); } public ZLPOSTagger(ZLMaxentModel model) { this(); this.model = model; this.prefixLength = 4; this.suffixLength = 4; this.beta = 0.35; // 0.4 delivers 1.08 POStags/pred } public ZLPOSTagger(ZLMaxentModel model, POSPriorModel priorModel) { this(); this.model = model; this.prefixLength = 4; this.suffixLength = 4; this.beta = 0.35; this.priorModel = priorModel; } public POSPriorModel getPriorModel() { return priorModel; } public void setPriorModel(POSPriorModel priorModel) { this.priorModel = priorModel; } /** 
get the features for one node * * FO -- fan-out, i.e. number of children * PN -- predicate name * RN -- parent name * RT -- parent relation * CT -- type of child * CN -- name of child * NA -- number of Argument children * A0N, A1N, ... -- names of argument children (by default) * PX -- prefix (N characters) * SX -- suffix (M characters) * HD -- has a digit * UH -- has an uppercase character or a hyphen * * @param n The graph node to extract features from * @return An array of strings representing the features */ // mww: switched to configurable arg names @SuppressWarnings("boxing") protected FeatureList getFeatures(LfGraphNode n) { FeatureList feats = new FeatureList(); int argchildren = 0; feats.addFeature("PN", n.getPredicateName()); feats.addFeature("FO", Integer.toString(n.getNumChildren())); // add name of parent, if any parent, and parent relation if(n.getMultiParents().size() > 0) { for(LfGraphNode parent : n.getMultiParents() ) { feats.addFeature("RN", parent.getPredicateName()); // add class name, if available String cls = parent.getPred().getNominal().toString(); // string is in X:Y:Z format. Remove 'X:' leaving 'Y:Z'. if(cls != null && cls.indexOf(':') > 0) { String cfeat = cls.substring(cls.indexOf(':') + 1); feats.addFeature("XP", cfeat); } } } else { feats.addFeature("RN", "0"); } // add types of children, count up argument children for(LfGraphLink lnk : n.getChildren()) { feats.addFeature("CT", lnk.getLabel()); if(lnk.getTarget() != null) { feats.addFeature("CN", lnk.getTarget().getPredicateName()); // mww: use short arg name String shortArgName = argNameMap.get(lnk.getLabel()); if (shortArgName != null) { // increment argchild count argchildren++; feats.addFeature(shortArgName + "N", lnk.getTarget().getPredicateName()); // add class info for arg child, if applicable String cls = lnk.getTarget().getPred().getNominal().toString(); // string is in X:Y:Z format. Remove 'X:' leaving 'Y:Z'. if(cls.indexOf(':') > 0) { String cfeat = cls.substring(cls.indexOf(':') + 1); // mww: for backwards compatibility String argNumOrName = (shortArgName.startsWith("A")) ? shortArgName.substring(1) : shortArgName; feats.addFeature("X" + argNumOrName + "D", cfeat); } } } } feats.addFeature("NA", Integer.toString(argchildren)); // class name feature, if available Nominal idx = n.getPred().getNominal(); String cls = idx.toString(); // string is in X:Y:Z format. Remove 'X:' leaving 'Y:Z'. 
if(cls.indexOf(':') > 0) { String cfeat = cls.substring(cls.indexOf(':') + 1); feats.addFeature("XC", cfeat); } // compute prefix and suffix String predname = n.getPredicateName(); // chop .04 part, if any Pattern pat = Pattern.compile("(\\w+)\\.\\d+$"); String basePredName = new String(predname); Matcher mat = pat.matcher(basePredName); if(mat.matches()) { basePredName = mat.group(1); } if(basePredName.length() > prefixLength + 1) { String prefix = predname.substring(0, prefixLength); feats.addFeature("PX", prefix); } if(basePredName.length() > suffixLength + 1) { String suffix = basePredName.substring(basePredName.length() - suffixLength, basePredName.length()); feats.addFeature("SX", suffix); } // check for digit and/or (upcase char and hyphen) if(basePredName.matches("\\d+")) { feats.addFeature("HD", "1"); } else { feats.addFeature("HD", "0"); } if(predname.matches("[A-Z]+") || predname.matches("-+")) { // XXX hack, because I don't think these PASS nodes should have a positive val // for this feature if(predname != "PASS") { feats.addFeature("UH", "1"); } else { feats.addFeature("UH", "0"); } } else { feats.addFeature("UH", "0"); } // features from prior model, PPOS, if applicable if(priorModel != null) { List> priors = priorModel.getPriors(predname); double beta = 0.1; double best = priors.get(0).a; for(Pair prior : priors) { if(prior.a > (beta * best)) { // add the feature PPOS=: feats.addFeatureWithProb("PPOS", prior.b, prior.a); } else { break; } } } return feats; } /** Get the features for the index'th node * * @param index The index into the LF * @return An array of strings representing the features */ public FeatureList getFeatures(int index) { for(LfGraphNode n : nomTable.values()) { if(n.getIndex() == index) { return getFeatures(n); } } return null; // bad index } public int getPrefixLength() { return prefixLength; } public void setPrefixLength(int prefixLength) { this.prefixLength = prefixLength; } public int getSuffixLength() { return suffixLength; } public void setSuffixLength(int suffixLength) { this.suffixLength = suffixLength; } /** Get all features for the current LF as a single multi-line string. * Used during extraction of training data. * @return All features for the current LF. 
*/ // formerly known as getAllFeaturesAndPOS() public String getAllFeaturesAndAnswer() { StringBuilder output = new StringBuilder(); for(LfGraphNode n : nomTable.values()) { String feats = getFeatures(n).getAllFeatures(); String postag = goldPred2Tag.get(n.getPred().getNominal().getName()); output = output.append(postag + " "); output = output.append(feats); output = output.append("\n"); } return output.toString(); } public String getAllFeaturesAndPOSWithID() { String output = ""; for(LfGraphNode n : nomTable.values()) { String feats = getFeatures(n).getAllFeatures(); String postag = n.getPred().getOrigin().getPOS(); output = output.concat("<" + Integer.toString(LFID) + "> " + postag + " " + feats); output = output.concat(postag + " "); output = output.concat(feats); output = output.concat("\n"); } return output; } /* Returns an arraylist of tuples (POS, probability) */ @SuppressWarnings({ "boxing" }) public ArrayList> getBetaBestPOS(FeatureList feats) { ArrayList> poss = new ArrayList>(); ArrayList probList = new ArrayList(); double[] probs = model.eval(feats.getAllFeaturesForMaxent(),true); for(int i = 0; i < probs.length; i++) { probList.add(new ProbIndexPair(probs[i], i)); } Collections.sort(probList); Collections.reverse(probList); double maxProb = probList.get(0).prob; for(int i = 0; i < probList.size(); i++) { if(probList.get(i).prob >= this.beta * maxProb) { poss.add(new Pair(model.getOutcome(probList.get(i).index), probList.get(i).prob)); } } return poss; } @SuppressWarnings("boxing") public ArrayList> getBetaBestPOS(String[] feats) { ArrayList> poss = new ArrayList>(); ArrayList probList = new ArrayList(); double[] probs = model.eval(feats,true); for(int i = 0; i < probs.length; i++) { probList.add(new ProbIndexPair(probs[i], i)); } Collections.sort(probList); Collections.reverse(probList); double maxProb = probList.get(0).prob; for(int i = 0; i < probList.size(); i++) { if(probList.get(i).prob >= this.beta * maxProb) { poss.add(new Pair(model.getOutcome(probList.get(i).index), probList.get(i).prob)); } } return poss; } // for tagging (i.e. evaluating feature list against model) public String getBestPOS(FeatureList feats) { // feed the features to the model, and get the best guess // at the POS tag given those features. 
double[] probs = model.eval(feats.getAllFeaturesForMaxent(),false); return new String(model.getBestOutcome(probs)); } public double getBeta() { return beta; } public void setBeta(double beta) { this.beta = beta; } /* (non-Javadoc) * @see opennlp.ccg.realize.hypertagger.TagExtractor#storeGoldStdPredInfo(java.lang.String) */ public void storeGoldStdPredInfo(String predInfo) { String[] preds = predInfo.split("\\s+"); if(preds != null) { for(int i = 1; i < preds.length; i++) { String[] info = preds[i].split(":"); if(info.length != 4) { System.err.println("Malformed pred-info field, skipping (value was \"" + preds[i] + "\")"); continue; } goldPred2Tag.put(info[0], DefaultTokenizer.unescape(info[2])); } } } public void loadPriorModel(File priorModelFile, File vocabFile) { try { priorModel = new POSPriorModel(priorModelFile.getAbsolutePath(), vocabFile.getAbsolutePath()); } catch (IOException e) { System.err.println("Unable to load prior model or vocab file"); e.printStackTrace(); } } @SuppressWarnings({"unused" }) public static void main(String[] args) throws IOException { String usage = "\nBasicPOSTagger -c (-i ) (-o [defaults to ])\n"+ " (-b beta value) (-m model file)\n"; if (args.length > 0 && args[0].equals("-h")) { System.out.println(usage); System.exit(0); } //SRILMFactoredBundleCorpusIterator inp = null; // input is just a file full of maxent events // i.e., we are not really tagging an lf, just testing a model by feeding it pre-extracted // events and comparing with the GS tags BufferedReader inp = null; BufferedWriter out = null; try { String inputCorp = null; String configFile = null; String output = null; String modelFile = null; double beta = 0; boolean test = false; for (int i = 0; i < args.length; i++) { if (args[i].equals("-i")) { inputCorp = args[++i]; continue; } if (args[i].equals("-o")) { output = args[++i]; continue; } if (args[i].equals("-c")) { configFile = args[++i]; continue; } if (args[i].equals("-m")) { modelFile = args[++i]; continue; } if (args[i].equals("-b")) { beta = Double.parseDouble(args[++i]); continue; } System.out.println("Unrecognized option: " + args[i]); } ResultSink rs = new ResultSink(ResultSink.ResultSinkType.POSTAG); try { inp = new BufferedReader(new FileReader(new File(inputCorp))); } catch (FileNotFoundException ex) { System.err.print("Input corpus " + inputCorp + " not found. Exiting..."); Logger.getLogger(POSPriorModel.class.getName()).log(Level.SEVERE, null, ex); System.exit(-1); } try { out = (output.equals("")) ? new BufferedWriter(new OutputStreamWriter(System.out)) : new BufferedWriter(new FileWriter(new File(output))); } catch (IOException ex) { System.err.print("Output file " + output + " not found. Exiting..."); Logger.getLogger(POSPriorModel.class.getName()).log(Level.SEVERE, null, ex); System.exit(-1); } //String[] pathKeys = { "maxentmodel", "priormodel", "priormodelvocab", "sequencemodel" }; //Map opts = ConfigFileProcessor.readInConfig(configFile, pathKeys); //POSPriorModel posPrior = new POSPriorModel(opts.get("priormodel"), opts.get("priormodelvocab")); ZLPOSTagger post = new ZLPOSTagger(new ZLMaxentModel(modelFile)); if(beta > 0) { post.setBeta(beta); } //post.setPriorModel(posPrior); // unneeded? 
String line; int count = 0; int wins = 0; int tagsPerPred = 0; while(true) { line = inp.readLine(); if(line == null) { break; } count++; int pos = line.indexOf(' '); String gs = line.substring(0,pos); //System.err.println("GS: " + gs); //System.err.println("Featline: " + line.substring(pos + 1)); String[] feats = line.substring(pos+1).split("\\s+"); ArrayList> ptags = post.getBetaBestPOS(feats); tagsPerPred += ptags.size(); // now check for the win... for(Pair p : ptags) { if(p.a.equals(gs)) { wins++; break; } } } // for now, just print overall accuracy out.write("Beta: " + post.getBeta() + "\n"); out.write("Acc: " + (double)wins / (double)count * 100.0 + "\n"); out.write("Tags/Pred: " + (double)tagsPerPred / (double)count + "\n"); out.flush(); } catch(Throwable t) { t.printStackTrace(); } finally { try { inp.close(); out.close(); } catch (IOException ex) { Logger.getLogger(POSPriorModel.class.getName()).log(Level.SEVERE, null, ex); } } } public static ZLPOSTagger ZLPOSTaggerFactory(String configFile) throws IOException { ZLPOSTagger postagger = new ZLPOSTagger(); String[] pathKeys = { "priormodel", "priormodelvocab", "maxentmodel"}; Map opts = ConfigFileProcessor.readInConfig(configFile, pathKeys); String priorModelFile = opts.get("priormodel"); if(priorModelFile != null) { String vocabFile = opts.get("priormodelvocab"); if(vocabFile == null) { throw new IOException("A vocab file must be specified."); } postagger.loadPriorModel(new File(priorModelFile), new File(vocabFile)); } String modelFile = opts.get("maxentmodel"); if(modelFile == null) { throw new IOException("You must specify the maxent model to use."); } postagger.model = new ZLMaxentModel(modelFile); String betaString = opts.get("beta"); if(betaString != null) { double beta = Double.parseDouble(betaString); postagger.beta = beta; } return postagger; } } ================================================ FILE: src/opennlp/ccg/synsem/AbstractCat.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-5 Jason Baldridge, Gann Bierner and // University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; import java.io.IOException; import java.io.Serializable; import gnu.trove.*; import org.jdom.*; import opennlp.ccg.hylo.*; import opennlp.ccg.unify.*; /** * Abstract category adapter for CCG categories. * * @author Gann Bierner * @author Jason Baldridge * @author Michael White * @version $Revision: 1.22 $, $Date: 2011/05/22 03:40:55 $ */ public abstract class AbstractCat implements Category, Serializable { private static final long serialVersionUID = 1L; /** The feature structure, which should only be used with atomic categories. 
*/ protected FeatureStructure _featStruc; /** The logical form, which should be used only with the outermost category. */ protected LF _lf; /** The hash code, if already computed. */ private transient int _hashCode = -1; /** The hash code for the category without its LF, if already computed. */ private transient int _hashCodeNoLF = -1; /** The mapping from vars to ints, if already computed. */ private transient TObjectIntHashMap _varMap = null; /** The supertag, if already computed. */ protected String _supertag = null; /** Default constructor. */ public AbstractCat() {} /** Constructor which sets the LF. */ public AbstractCat(LF lf) { _lf = lf; } /** * Constructor which retrieves the LF from the XML element * and flattens it to a conjunction of elementary predications * (or a single one). */ public AbstractCat(Element elt) { Element lfElt = elt.getChild("lf"); if (lfElt != null) { _lf = HyloHelper.flattenLF(HyloHelper.getLF(lfElt)); } } /** * Adds an XML element for the LF, if any, to the given catElt. * Uses {@link HyloHelper#toXml(LF)}. */ public void toXml(Element catElt) { if (_lf != null) catElt.addContent(HyloHelper.toXml(_lf)); } // during deserialization, intern computed supertag, and ensure varmap recomputed private void readObject(java.io.ObjectInputStream in) throws IOException, ClassNotFoundException { in.defaultReadObject(); if (_supertag != null) _supertag = _supertag.intern(); _varMap = null; } /** Gets the feature structure. */ public FeatureStructure getFeatureStructure() { return _featStruc; } /** Sets the feature structure. */ public void setFeatureStructure(FeatureStructure fs) { _featStruc = fs; } /** Gets the LF. */ public LF getLF() { return _lf; } /** Sets the LF. */ public void setLF(LF lf) { _lf = lf; } //----------------------------------------------------------------- // methods from Category which should be implemented by subclasses of // AbstractCat public abstract String toString(); /** * Returns the supertag for the category. */ public abstract String getSupertag(); /** * This will return a TeX formatted representation for a category. * If toTeX() is not implemented for this category, the normal * toString() method is invoked instead. */ public String toTeX() { return toString(); } public abstract Category copy(); public abstract Category shallowCopy(); public abstract Object fill (Substitution s) throws UnifyFailure; public abstract void unifyCheck (Object u) throws UnifyFailure; /** NB: The LF does not participate in unification. */ public abstract Object unify (Object u, Substitution sub) throws UnifyFailure; /** * Returns the target category of this category. 
*/ public abstract TargetCat getTarget(); //----------------------------------------------------------------- // implemented methods from Category public boolean shallowEquals(Object o) { return equals(o); } public void deepMap(ModFcn mf) { if (_lf != null) _lf.deepMap(mf); mf.modify(this); } public void forall(CategoryFcn f) { f.forall(this); } public boolean occurs(Variable v) { if (_lf == null) return false; return _lf.occurs(v); } // methods to support printing of Categories public String prettyPrint() { return prettyPrint(""); } protected String prettyPrint(String pad) { return pad+toString(); } protected int prettyLength(String s) { int max=0, cur=0; for(int i=0; i info) { List args = new ArrayList(); for (Iterator infoIt = info.iterator(); infoIt.hasNext();) { Element el = infoIt.next(); String elName = el.getName(); if (elName.equals("setarg")) { args.add(new SetArg(el)); _hasSet = true; } else if (elName.equals("dollar")) { String name = el.getAttributeValue("name"); if (name == null) name = el.getAttributeValue("n"); args.add(new Dollar(name)); _hasDollar = true; } else if (elName.equals("slash") || elName.equals("sl")) { Slash s = new Slash(el); Element argEl = infoIt.next(); if (argEl.getName().equals("dollar")) { String name = argEl.getAttributeValue("name"); if (name == null) name = argEl.getAttributeValue("n"); args.add(new Dollar(s, name)); _hasDollar = true; } else { args.add(new BasicArg(s, CatReader.getCat(argEl))); } } else { System.out.println("Invalid element for creating ArgStack: " + elName); } } _list = new Arg[args.size()]; args.toArray(_list); } public void toXml(Element catElt) { for (Arg arg: _list) { if (arg instanceof SetArg) catElt.addContent(((SetArg) arg).toXml()); else if (arg instanceof Dollar) { Dollar dollar = (Dollar) arg; if (!dollar.getSlash().toString().equals("|.")) catElt.addContent(dollar.getSlash().toXml()); Element dollarElt = new Element("dollar"); dollarElt.setAttribute("name", dollar.name()); catElt.addContent(dollarElt); } else if (arg instanceof BasicArg) { BasicArg barg = (BasicArg) arg; catElt.addContent(barg.getSlash().toXml()); catElt.addContent(barg.getCat().toXml()); } } } public void addAt(Arg c, int index) { Arg[] $list = new Arg[_list.length + 1]; insert(subList(0, index)._list, $list, 0); $list[index] = c; insert(subList(index)._list, $list, index + 1); _list = $list; if (c instanceof Dollar) { _hasDollar = true; } else if (c instanceof SetArg) { _hasSet = true; } } public void add(Arg c) { Arg[] $list = new Arg[_list.length + 1]; int last = insert(_list, $list, 0); $list[last] = c; _list = $list; if (c instanceof Dollar) { _hasDollar = true; } else if (c instanceof SetArg) { _hasSet = true; } } public void addAt(ArgStack cl, int index) { Arg[] $list = new Arg[_list.length + cl._list.length]; int last = insert(subList(0, index)._list, $list, 0); last = insert(cl._list, $list, last); insert(subList(index)._list, $list, last); _list = $list; if (cl.containsDollarArg()) { _hasDollar = true; } else if (cl.containsSetArg()) { _hasSet = true; } } public void add(ArgStack cl) { Arg[] $list = new Arg[_list.length + cl._list.length]; int last = insert(_list, $list, 0); insert(cl._list, $list, last); _list = $list; if (cl.containsDollarArg()) { _hasDollar = true; } else if (cl.containsSetArg()) { _hasSet = true; } } public void addFront(Arg c) { Arg[] $list = new Arg[_list.length + 1]; $list[0] = c; insert(_list, $list, 1); _list = $list; if (c instanceof Dollar) { _hasDollar = true; } else if (c instanceof SetArg) { _hasSet = true; } } 
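// Note: an ArgStack is the flattened argument sequence of a complex category under the
// non-recursive representation used by ComplexCat; e.g. for a category like s\np/np the
// target is s and the stack holds the two BasicArgs \np and /np, with the outermost
// argument (/np here) stored last (cf. getLast/setLast below).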
public void addFront(ArgStack cl) { Arg[] $list = new Arg[_list.length + cl._list.length]; int last = insert(cl._list, $list, 0); insert(_list, $list, last); _list = $list; if (cl.containsDollarArg()) { _hasDollar = true; } else if (cl.containsSetArg()) { _hasSet = true; } } public void insertFront(ArgStack cl) { insertAt(cl, 0); } public void insertEnd(ArgStack cl) { insertAt(cl, _list.length - 1); } public void insertAt(ArgStack cl, int index) { Arg insertInto = _list[index]; if (insertInto instanceof BasicArg) { cl.add(insertInto); _list[index] = new SetArg(cl); _hasSet = true; } else if (insertInto instanceof SetArg) { ((SetArg) insertInto).add(cl); } else { System.out.println("Problem inserting arg stack: " + cl); } } public int size() { return _list.length; } public boolean containsDollarArg() { return _hasDollar; } public boolean containsSetArg() { return _hasSet; } public Arg get(int i) { return _list[i]; } public void set(int i, Arg c) { _list[i] = c; if (c instanceof Dollar) { _hasDollar = true; } else if (c instanceof SetArg) { _hasSet = true; } } public Arg getLast() { return _list[_list.length - 1]; } public void setLast(Arg c) { set(_list.length - 1, c); } /** Sets the harmonic composition result of each arg's slash. */ public void setSlashHarmonicCompositionResult(boolean harmonicResult) { for (int i=0; i < _list.length; i++) { _list[i].setSlashHarmonicCompositionResult(harmonicResult); } } public ArgStack copy() { Arg[] $list = new Arg[_list.length]; for (int i = 0; i < $list.length; i++) { $list[i] = _list[i].copy(); } return new ArgStack($list); } public ArgStack copyWithout(int indexToRemove) { Arg[] $list = new Arg[_list.length - 1]; if ($list.length < 1) { System.out.println("Removing last item from an argument stack!"); } int index = 0; for (int i = 0; i < _list.length; i++) { if (i != indexToRemove) { $list[index++] = _list[i].copy(); } } return new ArgStack($list); } public ArgStack subList(int from) { return subList(from, _list.length); } public ArgStack subList(int from, int upto) { Arg[] $list; if (upto > from) { $list = new Arg[upto - from]; int index = 0; for (int i = from; i < upto; i++) { $list[index++] = _list[i]; } } else { $list = new Arg[0]; } return new ArgStack($list); } public ArgStack shallowCopy() { return new ArgStack(_list); } public boolean occurs(Variable v) { for (int i = 0; i < _list.length; i++) { if (_list[i].occurs(v)) { return true; } } return false; } public ArgStack fill(Substitution s) throws UnifyFailure { ArgStack args = new ArgStack(); for (int i = 0; i < _list.length; i++) { Object value = _list[i].fill(s); if (value instanceof ArgStack) { args.add((ArgStack) value); } else { args.add((Arg) value); } } return args; } public void deepMap(ModFcn mf) { for (int i = 0; i < _list.length; i++) { _list[i].deepMap(mf); } } public boolean containsContrarySlash() { for (int i = 0; i < _list.length; i++) { if (_list[i] instanceof BasicArg && !((BasicArg) _list[i]).getSlash().sameDirAsModality()) { return true; } else if (_list[i] instanceof SetArg && ((SetArg) _list[i]).containsContrarySlash()) { return true; } } return false; } public void slashesUnify(Slash s) throws UnifyFailure { for (int i = 0; i < _list.length; i++) { _list[i].unifySlash(s); } } public int unifySuffix(ArgStack as, Substitution sub) throws UnifyFailure { int asIndex = as.size(); for (int i = _list.length - 1; i >= 0; i--) { asIndex--; get(i).unify(as.get(asIndex), sub); } return asIndex; } public ArgStack unify(ArgStack as, Substitution sub) throws UnifyFailure { return 
unifyPrefix(as, as.size(), sub); } public ArgStack unifyPrefix(ArgStack as, int upto, Substitution sub) throws UnifyFailure { ArgStack $args; if (containsDollarArg()) { if (as.containsDollarArg()) { $args = unifyDollarWithDollar(as, upto, sub); } else { $args = unifyDollarWithNoDollar(size(), as, upto, sub); } } else if (as.containsDollarArg()) { $args = as.unifyDollarWithNoDollar(upto, this, size(), sub); } else if (size() == upto) { $args = unifySimple(as, upto, sub); } else { $args = unifyComplex(as, upto, sub); // throw new UnifyFailure(); } return $args; } private ArgStack unifySimple(ArgStack as, int upto, Substitution sub) throws UnifyFailure { ArgStack $args = new ArgStack(); for (int i = upto - 1; i >= 0; i--) { $args.addFront((Arg) _list[i].unify(as.get(i), sub)); } return $args; } private ArgStack unifyComplex(ArgStack as, int upto, Substitution sub) throws UnifyFailure { ArgStack $args = new ArgStack(); int aIndex = size() - 1; int bIndex = upto - 1; while (aIndex >= 0 && bIndex >= 0) { // while (null != aArg && null != bArg) { Arg aArg = get(aIndex); Arg bArg = as.get(bIndex); if ((aArg instanceof BasicArg && bArg instanceof BasicArg) || (aArg instanceof SetArg && bArg instanceof SetArg)) { $args.addFront((Arg) aArg.unify(bArg, sub)); aIndex--; bIndex--; } else if (aArg instanceof BasicArg && bArg instanceof SetArg) { int setsize = ((SetArg) bArg).size(); if (setsize <= aIndex + 1) { int stop = aIndex - setsize; for (; aIndex > stop;) { aIndex--; if (bArg instanceof BasicArg) { $args.addFront((Arg) aArg.unify(bArg, sub)); } else { int idInSet = ((SetArg) bArg) .indexOf((BasicArg) aArg); if (idInSet == -1) throw new UnifyFailure(); $args.addFront((Arg) aArg.unify(((SetArg) bArg) .get(idInSet), sub)); aArg = get(aIndex); bArg = ((SetArg) bArg).copyWithout(idInSet); } } bIndex--; } else { throw new UnifyFailure(); } } else if (aArg instanceof SetArg && bArg instanceof BasicArg) { throw new UnifyFailure(); } else { throw new UnifyFailure(); } } if (aIndex > -1 || bIndex > -1) { throw new UnifyFailure(); } return $args; } private ArgStack unifyDollarWithNoDollar(int uptoThis, ArgStack otherStack, int uptoOther, Substitution sub) throws UnifyFailure { if ((!(_hasSet || otherStack._hasSet) && uptoThis > uptoOther + 1) || (uptoThis > 1 && uptoOther < 1)) { throw new UnifyFailure(); } ArgStack $args = new ArgStack(); otherStack = otherStack.subList(0, uptoOther); int otherIndex = uptoOther - 1; for (int i = uptoThis - 1; i >= 0; i--) { Arg argi = get(i); if (argi instanceof Dollar) { if (i > 0) { throw new UnifyFailure(); } else { ArgStack $subArgs = otherStack.subList(0, otherIndex + 1); // Slash dsl = ((Dollar) argi).getSlash(); ((Dollar) argi).unify($subArgs.copy(), sub); otherIndex = 0; $args.addFront($subArgs); } } else if (argi instanceof BasicArg) { if (otherIndex < 0) { throw new UnifyFailure(); } Arg otherArg = otherStack.get(otherIndex); if (otherArg instanceof BasicArg) { $args.addFront((Arg) argi.unify(otherArg, sub)); otherIndex--; } else if (otherArg instanceof SetArg) { SetArg sa = (SetArg) otherArg; int id = sa.indexOf((BasicArg) argi); if (id == -1) throw new UnifyFailure(); $args.addFront((Arg) argi.unify(sa.get(id), sub)); otherStack.set(otherIndex, sa.copyWithout(id)); } } else { throw new UnifyFailure(); } } if (otherIndex > 0) { throw new UnifyFailure(); } return $args; } private ArgStack unifyDollarWithDollar(ArgStack as, int upto, Substitution sub) throws UnifyFailure { ArgStack $args; if (size() == 1) { $args = as.subList(0, upto); ((Dollar) 
get(0)).unify($args.copy(), sub); } else if (upto == 1) { $args = subList(0, size()); ((Dollar) as.get(0)).unify($args.copy(), sub); } else if (upto == size()) { $args = unifySimple(as, upto, sub); } else { throw new UnifyFailure(); } return $args; } public void forall(CategoryFcn fcn) { for (int i = 0; i < _list.length; i++) { _list[i].forall(fcn); } } private void checkForDollar() { for (int i = 0; i < _list.length; i++) { if (_list[i] instanceof Dollar) { _hasDollar = true; return; } } } private void checkForSet() { for (int i = 0; i < _list.length; i++) { if (_list[i] instanceof SetArg) { _hasSet = true; return; } } } public String toString() { StringBuffer sb = new StringBuffer(); for (int i = 0; i < _list.length; i++) { sb.append(_list[i].toString()); } return sb.toString(); } // private boolean methodExists(Object o, String methodName) { // java.lang.reflect.Method[] m = o.getClass().getMethods(); // for (int i = 0; i < m.length; i++) // if (m[i].getName() == methodName) { // if (m[i].getDeclaringClass().toString().startsWith("class")) // return true; // else // return false; // } // return false; // } /** * Returns the supertag for this arg stack. */ public String getSupertag() { StringBuffer sb = new StringBuffer(); for (int i = 0; i < _list.length; i++) { Arg arg = (Arg) _list[i]; sb.append(arg.getSupertag()); } return sb.toString(); } /** * Returns a TeX-formatted string representation for this arg stack. */ public String toTeX() { StringBuffer sb = new StringBuffer(); for (int i = 0; i < _list.length; i++) { sb.append(_list[i].toTeX()); } return sb.toString(); } /** * Returns a hash code using the given map from vars to ints. */ public int hashCode(TObjectIntHashMap varMap) { int retval = 0; for (int i = 0; i < _list.length; i++) { retval += _list[i].hashCode(varMap); } return retval; } /** * Returns whether this arg stack equals the given object up to variable * names, using the given maps from vars to ints. */ public boolean equals(Object obj, TObjectIntHashMap varMap, TObjectIntHashMap varMap2) { if (obj.getClass() != this.getClass()) { return false; } ArgStack as = (ArgStack) obj; if (_list.length != as._list.length) { return false; } for (int i = 0; i < _list.length; i++) { if (!_list[i].equals(as._list[i], varMap, varMap2)) { return false; } } return true; } protected static int insert(Arg[] a, Arg[] b, int pos) { for (int i = 0; i < a.length; i++) { b[pos++] = a[i]; } return pos; } } ================================================ FILE: src/opennlp/ccg/synsem/AtomCat.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-11 Jason Baldridge, Gann Bierner and // University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; import opennlp.ccg.unify.*; import opennlp.ccg.util.DisplayPrefs; import opennlp.ccg.grammar.Grammar; import org.jdom.*; import gnu.trove.*; /** * The most basic CG category. This corresponds to a category like 'np[acc]', * i.e. a category name and associated features. * * @author Gann Bierner * @author Jason Baldridge * @author Michael White * @version $Revision: 1.18 $, $Date: 2011/07/15 03:02:53 $ */ public final class AtomCat extends AbstractCat implements TargetCat { private static final long serialVersionUID = 1L; private String type; /** Flag indicating whether this cat is a fragment with completion status true (defaults to false). */ public boolean fragCompletion = false; /** Constructor which creates an atomic category with the given type. */ public AtomCat(String t) { this(t, new GFeatStruc()); } /** Constructor which creates an atomic category with the given type and feature structure. */ public AtomCat(String t, FeatureStructure fs) { this(t, fs, null); } /** Constructor which creates an atomic category with the given type, feature structure and LF. */ public AtomCat(String t, FeatureStructure fs, LF lf) { super(lf); type = t; _featStruc = fs; } /** Constructor which retrieves the atomic category from the XML element. */ public AtomCat(Element acel) { // call super to get LF if present super(acel); // get type type = acel.getAttributeValue("type"); if (type == null) type = acel.getAttributeValue("t"); // get feature structure Element fsEl = acel.getChild("fs"); if (fsEl != null) { _featStruc = new GFeatStruc(fsEl); } // or create empty one else { _featStruc = new GFeatStruc(); } } /**Returns an XML element representing the category. */ public Element toXml() { Element retval = new Element("atomcat"); retval.setAttribute("type", type); if (!_featStruc.isEmpty() || _featStruc.getIndex() > 0) { if (_featStruc instanceof GFeatStruc) { // only supporting GFeatStruc per xml construction retval.addContent(((GFeatStruc) _featStruc).toXml()); } } // call super to add LF if present super.toXml(retval); return retval; } /** * Returns this category as the target category. */ public TargetCat getTarget() { return this; } public String getType() { return type; } public Category copy() { AtomCat retval = new AtomCat(type, _featStruc.copy(), (_lf == null) ? null : (LF) _lf.copy()); retval.fragCompletion = fragCompletion; return retval; } public Category shallowCopy() { AtomCat retval = new AtomCat(type, _featStruc, _lf); retval.fragCompletion = fragCompletion; return retval; } public void deepMap(ModFcn mf) { super.deepMap(mf); _featStruc.deepMap(mf); } public void unifyCheck (Object u) throws UnifyFailure { if (u instanceof AtomCat) { AtomCat u_ac = (AtomCat)u; if (!(type.equals(u_ac.type))) { throw new UnifyFailure(); } if (_featStruc != null && u_ac._featStruc != null) { _featStruc.unifyCheck(u_ac._featStruc); } } else if (!(u instanceof Variable)) { throw new UnifyFailure(); } } /** NB: The LF does not participate in unification. 
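 * (Illustrative example: np unifies with np[acc], since the type names match and the
 * feature structures unify, but np can never unify with s.)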
*/ public Object unify (Object u, Substitution sub) throws UnifyFailure { if (u instanceof AtomCat && type.equals(((AtomCat)u).type)) { AtomCat u_ac = (AtomCat)u; FeatureStructure $fs; if (_featStruc == null) { $fs = u_ac._featStruc; } else if (u_ac._featStruc == null) { $fs = _featStruc; } else { $fs = (FeatureStructure)_featStruc.unify(u_ac._featStruc, sub); } return new AtomCat(type, $fs); } else { throw new UnifyFailure(); } } public Object fill (Substitution s) throws UnifyFailure { AtomCat $ac = new AtomCat(type, (FeatureStructure)_featStruc.fill(s), (_lf == null) ? null : (LF) _lf.fill(s)); return $ac; } public boolean shallowEquals(Object c) { if (c instanceof AtomCat) { AtomCat ac = (AtomCat)c; return type.equals(ac.type); } return false; } public String toString() { DisplayPrefs prefs = Grammar.theGrammar.prefs; StringBuffer sb = new StringBuffer(); sb.append(type); if (fragCompletion) sb.append("_c"); if(_featStruc != null && prefs.showFeats) sb.append(_featStruc.toString()); if (_lf != null && prefs.showSem) { sb.append(" : ").append(_lf.toString()); } if (sb.length() == 0) return "UnknownCat"; return sb.toString(); } /** * Returns the interned supertag for the category. */ public String getSupertag() { if (_supertag != null) return _supertag; StringBuffer sb = new StringBuffer(); sb.append(type); if(_featStruc != null) sb.append(_featStruc.getSupertagInfo()); if (sb.length() == 0) _supertag = "UnknownCat"; else _supertag = sb.toString().intern(); return _supertag; } public String toTeX() { DisplayPrefs prefs = Grammar.theGrammar.prefs; StringBuffer sb = new StringBuffer(); sb.append(type); if(_featStruc != null && prefs.showFeats) sb.append(_featStruc.toTeX()); if (sb.length() == 0) return "UnknownCat"; return sb.toString(); } /** * Returns a hash code for this category ignoring the LF, * using the given map from vars to ints. */ public int hashCodeNoLF(TObjectIntHashMap varMap) { int retval = type.hashCode(); if (_featStruc != null) { if (_featStruc instanceof GFeatStruc) { retval += ((GFeatStruc)_featStruc).hashCode(varMap); } else { // nb: would be nice to get rid of this case retval += _featStruc.hashCode(); } } return retval; } /** * Returns whether this category equals the given object * up to variable names, using the given maps from vars to ints, * ignoring the LFs (if any). */ public boolean equalsNoLF(Object obj, TObjectIntHashMap varMap, TObjectIntHashMap varMap2) { if (obj.getClass() != this.getClass()) { return false; } AtomCat ac = (AtomCat) obj; if (_featStruc != null && ac._featStruc == null) { return false; } if (_featStruc == null && ac._featStruc != null) { return false; } if (!type.equals(ac.type)) { return false; } if (_featStruc != null) { if (_featStruc instanceof GFeatStruc) { if (!((GFeatStruc)_featStruc).equals(ac._featStruc, varMap, varMap2)) { return false; } } else { // nb: would be nice to get rid of this case if (!_featStruc.equals(ac._featStruc)) { return false; } } } return true; } /** * Returns whether this category is a fragment category; * returns true iff the type of this cat is "frag". 
*/ public boolean isFragment() { return type.equals("frag"); } } ================================================ FILE: src/opennlp/ccg/synsem/BasicArg.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-5 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; import java.io.Serializable; import gnu.trove.*; import opennlp.ccg.unify.*; /** * A basic argument that contains a slash and a category. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.9 $, $Date: 2009/11/28 03:39:27 $ */ public final class BasicArg implements Arg, Serializable { private static final long serialVersionUID = -4244825501682166456L; private final Slash _slash; private final Category _cat; public BasicArg(Slash s, Category c) { _slash = s; _cat = c; } public Arg copy() { return new BasicArg(_slash.copy(), _cat.copy()); } public Slash getSlash() { return _slash; } public void setSlashModifier(boolean modifier) { _slash.setModifier(modifier); } public void setSlashHarmonicCompositionResult(boolean harmonicResult) { _slash.setHarmonicCompositionResult(harmonicResult); } public Category getCat() { return _cat; } public boolean occurs(Variable v) { return _cat.occurs(v); } public Object fill(Substitution sub) throws UnifyFailure { return new BasicArg((Slash) _slash.fill(sub), (Category) _cat.fill(sub)); } public void forall(CategoryFcn fcn) { _cat.forall(fcn); } public void unifySlash(Slash s) throws UnifyFailure { _slash.unifyCheck(s); } public void unifyCheck(Object u) throws UnifyFailure { } public Object unify(Object u, Substitution sub) throws UnifyFailure { if (u instanceof BasicArg) { return new BasicArg((Slash) _slash .unify(((BasicArg) u)._slash, sub), (Category) _cat.unify( ((BasicArg) u)._cat, sub)); } else { throw new UnifyFailure(); } } public void deepMap(ModFcn mf) { _slash.deepMap(mf); _cat.deepMap(mf); } public String toString() { StringBuffer sb = new StringBuffer(); sb.append(_slash.toString()); if (_cat instanceof ComplexCat) { sb.append('(').append(_cat).append(')'); } else { sb.append(_cat); } return sb.toString(); } /** * Returns the supertag for this arg. */ public String getSupertag() { StringBuffer sb = new StringBuffer(); sb.append(_slash.getSupertag()); if (_cat instanceof ComplexCat) { sb.append('(').append(_cat.getSupertag()).append(')'); } else { sb.append(_cat.getSupertag()); } return sb.toString(); } /** * Returns a TeX-formatted string representation for this arg. 
*/ public String toTeX() { StringBuffer sb = new StringBuffer(); sb.append(_slash.toTeX()); if (_cat instanceof ComplexCat) { sb.append('(').append(_cat.toTeX()).append(')'); } else { sb.append(_cat.toTeX()); } return sb.toString(); } /** * Returns a hash code for this, using the given map from vars to ints. */ public int hashCode(TObjectIntHashMap varMap) { return _slash.hashCode(varMap) + _cat.hashCodeNoLF(varMap); } /** * Returns whether this arg equals the given object up to variable names, * using the given maps from vars to ints. */ public boolean equals(Object obj, TObjectIntHashMap varMap, TObjectIntHashMap varMap2) { if (obj.getClass() != this.getClass()) { return false; } BasicArg ba = (BasicArg) obj; return _slash.equals(ba._slash, varMap, varMap2) && _cat.equalsNoLF(ba._cat, varMap, varMap2); } } ================================================ FILE: src/opennlp/ccg/synsem/CatReader.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-4 Jason Baldridge, Gann Bierner and // University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; import org.jdom.*; /** * Utility class to build categories. * * @author Jason Baldridge * @author Gann Bierner * @author Michael White * @version $Revision: 1.4 $, $Date: 2005/10/18 22:20:15 $ */ public class CatReader { public static Category getCat(Element catel) { Category cat = null; String catType = catel.getName(); if (catType.equals("atomcat") || catType.equals("ac")) { cat = new AtomCat(catel); } else if (catType.equals("complexcat") || catType.equals("cc")) { cat = new ComplexCat(catel); } return cat; } } ================================================ FILE: src/opennlp/ccg/synsem/Category.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-5 Jason Baldridge, Gann Bierner and // University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. 
// // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; import opennlp.ccg.unify.*; import opennlp.ccg.hylo.*; import gnu.trove.*; import org.jdom.Element; /** * A CCG category. * * @author Jason Baldridge * @author Gann Bierner * @author Michael White * @version $Revision: 1.11 $, $Date: 2011/05/22 03:40:55 $ */ public interface Category extends Unifiable, Mutable, java.io.Serializable { /** * Accessor function for the feature structure associated with this category. * * @return the feature structure for this category */ public FeatureStructure getFeatureStructure(); /** * Gives this category a new feature structure. * * @param fs the new feature structure */ public void setFeatureStructure(FeatureStructure fs); /** Gets the LF. */ public LF getLF(); /** Sets the LF. */ public void setLF(LF lf); /** * Determines if this category is equal to another on the top level. * It does not check sub categories. * * @param o object to check for equality * @return whether or not this is shallowly equal to object */ public boolean shallowEquals(Object o); /** * Deep copies this category. * * @return a deep copy of this category */ public Category copy(); /** Shallow copies this category. */ public Category shallowCopy(); /** * Iterates through this Category applying a function to this category * and every subcategory. * * @param f a function to be applied */ public void forall(CategoryFcn f); //to ls /** * Returns a hash code for this category. * The hash code handles equivalence up to variable names * as long as features and predicates are in the same order. */ public int hashCode(); /** * Returns a hash code for this category ignoring the LF. */ public int hashCodeNoLF(); /** * Returns a hash code for this category ignoring the LF, * using the given map from vars to ints, * to allow for equivalence up to variable names. */ public int hashCodeNoLF(TObjectIntHashMap varMap); /** * Returns whether this category equals the given object. * Equivalence up to variable names is handled * as long as features and predicates are in the same order. */ public boolean equals(Object obj); /** * Returns whether this category equals the given object, * ignoring the LFs (if any). */ public boolean equalsNoLF(Object obj); /** * Returns whether this category equals the given object * up to variable names, using the given maps from vars to ints, * ignoring the LFs (if any). */ public boolean equalsNoLF(Object obj, TObjectIntHashMap varMap, TObjectIntHashMap varMap2); /** * Returns the target category of this category. */ public TargetCat getTarget(); /** * Returns the nominal which is the value of the index feature on the * target cat, or null if none. */ public Nominal getIndexNominal(); /** * Returns the interned supertag for the category. */ public String getSupertag(); /** * Returns whether this category is a fragment category. */ public boolean isFragment(); /** * Returns a TeX-formatted string representation for the category. */ public String toTeX(); /** * Returns an XML element representing the category.
*/ public Element toXml(); } ================================================ FILE: src/opennlp/ccg/synsem/CategoryFcn.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002 Jason Baldridge and Gann Bierner // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; /** * A set of functions that can be applied to Categories. This is a way of * getting around the fact that Java doesn't have 1st class functions. * Thus, if a method is needed that takes a function that works on Categories, * pass one of these instead. * * @author Gann Bierner * @version $Revision: 1.1.1.1 $, $Date: 2003/02/28 18:02:12 $ */ public interface CategoryFcn { /** * Converts a category to a different category * * @param c the category to change * @return the transformed category */ public Category fcn(Category c); /** * Converts a category to a different category with some additional * information about its context. * * @param a The logical form in which the category appears * @param c The category to convert * @param i The position of the category in the logical form * @return the transformed category */ public void fcn(Category a, Category c, int i); /** * Performs some destructive operation given a category * * @param c The category used for whatever purpose */ public void forall(Category c); } ================================================ FILE: src/opennlp/ccg/synsem/CategoryFcnAdapter.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002 Jason Baldridge and Gann Bierner // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; /** * An adapter for Category Functions so that you only have to implement the * methods you want. 
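 * For example (an illustrative sketch only; <code>cat</code> and <code>atoms</code> are
 * made-up names), all atomic categories in a category can be collected with an anonymous
 * subclass that overrides just <code>forall</code>:
 * <pre>
 *   final java.util.List atoms = new java.util.ArrayList();
 *   cat.forall(new CategoryFcnAdapter() {
 *       public void forall(Category c) {
 *           if (c instanceof AtomCat) atoms.add(c);
 *       }
 *   });
 * </pre>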
* * @author Gann Bierner * @version $Revision: 1.1.1.1 $, $Date: 2003/02/28 18:02:12 $ */ public class CategoryFcnAdapter implements CategoryFcn{ public Category fcn(Category c) {return c;} public void fcn(Category a, Category c, int i) {} public void forall(Category c) {}; } ================================================ FILE: src/opennlp/ccg/synsem/ComplexCat.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-5 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; import opennlp.ccg.unify.*; import opennlp.ccg.util.DisplayPrefs; import opennlp.ccg.grammar.Grammar; import gnu.trove.*; import org.jdom.*; import java.util.*; /** * A non-recursive representation of complex categories. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.15 $, $Date: 2009/06/18 23:38:57 $ */ public final class ComplexCat extends AbstractCat { private static final long serialVersionUID = 1L; private TargetCat _target; private ArgStack _args; /** Constructor with target and single arg. */ public ComplexCat(TargetCat target, Arg arg) { this(target, new ArgStack(arg)); } /** Constructor with target and arg stack. */ public ComplexCat(TargetCat target, ArgStack args) { this(target, args, null); } /** Constructor with target, arg stack and LF. */ public ComplexCat(TargetCat target, ArgStack args, LF lf) { super(lf); _target = target; if (args.size() < 1) { System.out.println("WARNING!!! Creating a ComplexCat with" + " empty argument stack!"); } _args = args; } /** Constructor which retrieves the complex category from the XML element. */ // also determines modifier slashes @SuppressWarnings("unchecked") public ComplexCat(Element el) { // call super to get LF if present super(el); // get children minus LF elt List info = el.getChildren(); Element lfElt = el.getChild("lf"); if (lfElt != null) { info.remove(lfElt); } // get target and args from first and rest of remaining children _target = (TargetCat) CatReader.getCat(info.get(0)); _args = new ArgStack(info.subList(1, info.size())); // set modifier slashes setModifierSlashes(); } /**Returns an XML element representing the category. 
*/ public Element toXml() { Element retval = new Element("complexcat"); retval.addContent(_target.toXml()); _args.toXml(retval); // call super to add LF if present super.toXml(retval); return retval; } // sets modifier slashes based on feat struc ids private void setModifierSlashes() { FeatureStructure targetFS = _target.getFeatureStructure(); int targetIndex = targetFS.getIndex(); if (targetIndex == 0) targetIndex = targetFS.getInheritsFrom(); if (targetIndex == 0) return; for (int i=0; i < _args.size(); i++) { Arg arg = _args.get(i); if (arg instanceof BasicArg) { setModifierSlash(targetIndex, (BasicArg)arg); } else if (arg instanceof SetArg) { SetArg sArg = (SetArg) arg; for (int j=0; j < sArg.size(); j++) { setModifierSlash(targetIndex, sArg.get(j)); } } } } // sets modifier slash based on the target index private void setModifierSlash(int targetIndex, BasicArg arg) { FeatureStructure argFS = arg.getCat().getTarget().getFeatureStructure(); // check for matching ids if (targetIndex == argFS.getIndex() || targetIndex == argFS.getInheritsFrom()) arg.getSlash().setModifier(true); } /** * Returns the target category of this category. */ public TargetCat getTarget() { return _target; } public Arg getArg(int pos) { return _args.get(pos); } public Arg getOuterArg() { return _args.getLast(); } public Category getResult() { return getSubResult(arity() - 1); } public Category getSubResult(int upto) { if (upto == 0) { return _target; } else { return new ComplexCat(_target, _args.subList(0, upto)); } } public ArgStack getArgStack() { return _args; } public ArgStack getArgStack(int from) { return _args.subList(from); } public boolean containsDollarArg() { return _args.containsDollarArg(); } public boolean containsSetArg() { return _args.containsSetArg(); } public void add(Arg a) { _args.add(a); } public void add(ArgStack as) { _args.add(as); } public void addBeforeEnd(ArgStack as) { int size = _args.size(); if (size < 1) { add(as); } else { _args.addAt(as, size - 1); } } public void addFront(ArgStack as) { _args.addFront(as); } public void insertFront(ArgStack as) { _args.insertFront(as); } public void insertEnd(ArgStack as) { _args.insertEnd(as); } public void set(int index, Arg c) { _args.set(index, c); } public void setOuterArgument(Arg c) { _args.setLast(c); } public int arity() { return _args.size(); } public Category copy() { return new ComplexCat((TargetCat) _target.copy(), _args.copy(), (_lf == null) ? null : (LF) _lf.copy()); } public Category shallowCopy() { return new ComplexCat(_target, _args, _lf); } public void deepMap(ModFcn mf) { super.deepMap(mf); _target.deepMap(mf); _args.deepMap(mf); } public void forall(CategoryFcn f) { f.forall(this); _target.forall(f); _args.forall(f); } public void unifyCheck(Object u) throws UnifyFailure { if (u instanceof ComplexCat) { ComplexCat cc = (ComplexCat) u; _target.unifyCheck(cc._target); } } /** NB: The LF does not participate in unification. 
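 * (Illustrative example: a complex category whose only argument is a dollar variable,
 * such as s$, unifies with the bare atomic category s by binding the dollar to an empty
 * argument stack; see the AtomCat branch below.)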
*/ public Object unify(Object u, Substitution sub) throws UnifyFailure { if (u instanceof AtomCat && arity() == 1 & containsDollarArg()) { sub.makeSubstitution((Dollar) _args.get(0), new ArgStack()); return GUnifier.unify(_target, (AtomCat) u, sub); } else if (u instanceof ComplexCat) { ComplexCat cc = (ComplexCat) u; ArgStack $args = _args.unify(cc._args, sub); Category $target = GUnifier.unify(_target, cc._target, sub); if ($args.size() == 0) { return $target; } else { return new ComplexCat((TargetCat) $target, $args); } } else { throw new UnifyFailure(); } } public boolean occurs(Variable v) { return super.occurs(v) || _target.occurs(v) || _args.occurs(v); } // nb: not yet sure about calling setLF methods public Object fill(Substitution s) throws UnifyFailure { Category $target = (Category) _target.fill(s); ArgStack $args = _args.fill(s); LF $lf = (_lf == null) ? null : (LF) _lf.fill(s); if ($args.size() == 0) { $target.setLF($lf); return $target; } if ($target instanceof TargetCat) { return new ComplexCat((TargetCat) $target, $args, $lf); } else if ($target instanceof ComplexCat) { ((ComplexCat) $target).add($args); $target.setLF($lf); return $target; } else { throw new UnifyFailure(); } } public String toString() { DisplayPrefs prefs = Grammar.theGrammar.prefs; StringBuffer sb = new StringBuffer(); sb.append(_target.toString()).append(_args.toString()); if (_lf != null && prefs.showSem) { sb.append(" : ").append(_lf.toString()); } return sb.toString(); } /** * Returns the interned supertag for the category. */ public String getSupertag() { if (_supertag != null) return _supertag; StringBuffer sb = new StringBuffer(); sb.append(_target.getSupertag()).append(_args.getSupertag()); _supertag = sb.toString().intern(); return _supertag; } public String toTeX() { // Preferences prefs = Preferences.userNodeForPackage(TextCCG.class); // boolean showSem = prefs.getBoolean(SHOW_SEMANTICS, false); StringBuffer sb = new StringBuffer(); sb.append(_target.toTeX()).append(_args.toTeX()); return sb.toString(); } /** * Returns a hash code for this category ignoring the LF, using the given * map from vars to ints. */ public int hashCodeNoLF(TObjectIntHashMap varMap) { int retval = _target.hashCodeNoLF(varMap); retval += _args.hashCode(varMap); return retval; } /** * Returns whether this category equals the given object up to variable * names, using the given maps from vars to ints, ignoring the LFs (if any). */ public boolean equalsNoLF(Object obj, TObjectIntHashMap varMap, TObjectIntHashMap varMap2) { if (obj.getClass() != this.getClass()) { return false; } ComplexCat cc = (ComplexCat) obj; if (!_target.equalsNoLF(cc._target, varMap, varMap2)) { return false; } if (!_args.equals(cc._args, varMap, varMap2)) { return false; } return true; } } ================================================ FILE: src/opennlp/ccg/synsem/DerivationHandler.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2010 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. 
See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; import opennlp.ccg.parse.DerivationHistory; /** * A class to simplify implementing a recursive procedure on a derivation. * Recursion is handled within the implementation of the abstract methods * by calls to handleDerivation, so that order of traversal * can be flexibly specified. Results may be optionally cached. * Note that the top step is only used with complete derivations. * * @author Michael White * @version $Revision: 1.1 $, $Date: 2010/02/21 16:44:59 $ */ abstract public class DerivationHandler<T> { /** Top step. */ abstract public T topStep(Sign sign); /** Lexical step. */ abstract public T lexStep(Sign sign); /** Unary step. */ abstract public T unaryStep(Sign sign, Sign headChild); /** Binary step. */ abstract public T binaryStep(Sign sign, boolean left, Sign headChild, Sign siblingChild); /** Checks for cached value, returning null if none. Defaults to null. */ public T checkCache(Sign sign) { return null; } /** Caches the result. Default no-op. */ public void cache(Sign sign, T result) {} /** Handles a complete derivation, invoking the top step. */ public T handleCompleteDerivation(Sign sign) { return topStep(sign); } /** Handles a sub-derivation, checking and updating cache. */ public T handleDerivation(Sign sign) { // check cache T retval = checkCache(sign); if (retval != null) return retval; // lexical case if (sign.isLexical()) { retval = lexStep(sign); cache(sign, retval); return retval; } // recursive case DerivationHistory dh = sign.getDerivationHistory(); Sign[] inputs = dh.getInputs(); // unary case if (inputs.length == 1) { Sign headChild = inputs[0]; retval = unaryStep(sign, headChild); cache(sign, retval); return retval; } // binary case else { boolean left; Sign headChild, siblingChild; if (sign.getLexHead() == inputs[0].getLexHead()) { left = true; headChild = inputs[0]; siblingChild = inputs[1]; } else { left = false; headChild = inputs[1]; siblingChild = inputs[0]; } retval = binaryStep(sign, left, headChild, siblingChild); cache(sign, retval); return retval; } } } ================================================ FILE: src/opennlp/ccg/synsem/Dollar.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-7 Jason Baldridge and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; import java.io.Serializable; import gnu.trove.*; import opennlp.ccg.unify.*; /** * A variable representing a stack of arguments * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.10 $, $Date: 2009/11/28 03:39:27 $ */ public final class Dollar implements Arg, Variable, Mutable, Indexed, Serializable { private static final long serialVersionUID = -5936227018184772678L; private final Slash _slash; private final String _name; private int _index = 0; private boolean _hasMostGeneralSlash = false; public Dollar(String name) { this(new Slash(), name); } public Dollar(Slash s, String name) { this(s, name, 0); } public Dollar(Slash s, String name, int id) { _slash = s; _name = name; _index = id; if (s.toString().equals("|.")) { _hasMostGeneralSlash = true; } } public String name() { return _name; } public int getIndex() { return _index; } public void setIndex(int uniqueIndex) { _index = uniqueIndex; } public Arg copy() { return new Dollar(_slash.copy(), _name, _index); } public void forall(CategoryFcn fcn) { } public Slash getSlash() { return _slash; } public void setSlashModifier(boolean modifier) { _slash.setModifier(modifier); } public void setSlashHarmonicCompositionResult(boolean harmonicResult) { _slash.setHarmonicCompositionResult(harmonicResult); } public boolean equals(Object o) { return (o instanceof Dollar && _index == ((Dollar) o).getIndex() && _slash .equals(((Dollar) o).getSlash())); } public int hashCode() { return 31 * _index + _slash.hashCode() ; } public boolean occurs(Variable v) { return (v instanceof Dollar && equals(v)); } public Object fill(Substitution sub) throws UnifyFailure { Object value = sub.getValue(this); if (value == null) { return this; } if (value instanceof Dollar) { return value; } // nb: must do occurs check here, at least in part b/c ArgStack doesn't // quite implement Unifiable if (value instanceof Arg && !((Arg) value).occurs(this)) { return ((Arg) value).fill(sub); } else if (value instanceof ArgStack && !((ArgStack) value).occurs(this)) { return ((ArgStack) value).fill(sub); } else { // System.out.println("Error in value for dollar: " + this +" = " + // value); throw new UnifyFailure(); } } public void unifySlash(Slash s) throws UnifyFailure { _slash.unifyCheck(s); } public void unifyCheck(Object u) throws UnifyFailure { } public Object unify(Object u, Substitution sub) throws UnifyFailure { if (u instanceof ArgStack && !((ArgStack) u).occurs(this)) { ((ArgStack) u).slashesUnify(_slash); } else if (u instanceof Arg && !((Arg) u).occurs(this)) { ((Arg) u).unifySlash(_slash); } else { throw new UnifyFailure(); } sub.makeSubstitution(this, u); return u; } public void deepMap(ModFcn mf) { mf.modify(this); } public String toString() { StringBuffer sb = new StringBuffer(); if (!_hasMostGeneralSlash) sb.append(_slash.toString()); sb.append('$').append(_name);// .append(_index); return sb.toString(); } /** * Returns the supertag for this dollar arg. */ public String getSupertag() { StringBuffer sb = new StringBuffer(); if (!_hasMostGeneralSlash) sb.append(_slash.getSupertag()); sb.append('$'); return sb.toString(); } /** * Returns a TeX-formatted string representation for this dollar arg. 
*/ public String toTeX() { StringBuffer sb = new StringBuffer(); if (!_hasMostGeneralSlash) sb.append(_slash.toTeX()); sb.append("\\$ \\subs{").append(_name).append("}");// .append(_index); return sb.toString(); } /** * Returns a hash code using the given map from vars to ints. */ public int hashCode(TObjectIntHashMap varMap) { int retval = _slash.hashCode(varMap); // see if this already in map if (varMap.containsKey(this)) { retval += varMap.get(this); } // otherwise add it else { int next = varMap.size() + 1; varMap.put(this, next); retval += next; } return retval; } /** * Returns whether this dollar equals the given object up to variable names, * using the given maps from vars to ints. */ public boolean equals(Object obj, TObjectIntHashMap varMap, TObjectIntHashMap varMap2) { if (this == obj) return true; if (obj.getClass() != this.getClass()) return false; Dollar d = (Dollar) obj; if (varMap.get(this) != varMap2.get(d)) return false; if (!_slash.equals(d._slash, varMap, varMap2)) return false; return true; } } ================================================ FILE: src/opennlp/ccg/synsem/GenerativeSyntacticModel.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2010 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; import java.io.*; import java.net.URL; import java.util.*; import opennlp.ccg.grammar.Grammar; import opennlp.ccg.lexicon.*; import opennlp.ccg.ngrams.ConditionalProbabilityTable; import opennlp.ccg.ngrams.NgramScorer; import opennlp.ccg.perceptron.*; import opennlp.ccg.test.Regression; import opennlp.ccg.test.RegressionInfo; import opennlp.ccg.test.RegressionInfo.TestItem; import opennlp.ccg.util.Pair; /** * A class implementing a variant of Hockenmaier's HWDep generative syntactic model, * with additional postag variables. * Note that the top step is only used with complete derivations. * Also note that for simplicity there is no special treatment of rare words, and thus * a single unknown word is used in the model, rather than one for each POS tag. * * @author Michael White * @version $Revision: 1.12 $, $Date: 2010/03/07 03:23:01 $ */ public class GenerativeSyntacticModel implements FeatureExtractor, SignScorer { /** Feature key. */ public static String genlogprobkey = "genlogprob"; /** Expansion string constant. */ public static final String EXPANSION = "E"; /** Left expansion string constant. */ public static final String LEFT = "left"; /** Right expansion string constant. */ public static final String RIGHT = "right"; /** Unary expansion string constant. */ public static final String UNARY = "unary"; /** Leaf expansion string constant. 
*/ public static final String LEAF = "leaf"; /** Category of parent string constant. */ public static final String PARENT = "P"; /** Category of head string constant. */ public static final String HEAD = "H"; /** Category of sibling string constant. */ public static final String SIBLING = "S"; /** Lexical head category of parent string constant. */ public static final String LEXCAT_PARENT = "CP"; /** Head postag of parent string constant. */ public static final String POS_PARENT = "T"; /** Head word of parent string constant. */ public static final String WORD_PARENT = "W"; /** Lexical head category of sibling string constant. */ public static final String LEXCAT_SIBLING = "CS"; /** Head postag of sibling string constant. */ public static final String POS_SIBLING = "TS"; /** Head word of sibling string constant. */ public static final String WORD_SIBLING = "WS"; /** Lexical head category of top string constant. */ public static final String LEXCAT_TOP = "CT"; /** Head postag top string constant. */ public static final String POS_TOP = "TT"; /** Head word of top string constant. */ public static final String WORD_TOP = "WT"; /** Derivation top string constant. */ public static final String TOP = ""; /** * Class for caching the model's log prob in a sign. */ public static class GenLogProb { /** The log prob. */ public final double logprob; /** Constructor. */ public GenLogProb(double logprob) { this.logprob = logprob; } } /** The top step model. */ protected ConditionalProbabilityTable topModel; /** The lexical step model. */ protected ConditionalProbabilityTable leafModel; /** The unary step model. */ protected ConditionalProbabilityTable unaryModel; /** The binary step model. */ protected ConditionalProbabilityTable binaryModel; /** Constructor with file names. */ public GenerativeSyntacticModel(String topModelFN, String leafModelFN, String unaryModelFN, String binaryModelFN) throws IOException { topModel = new ConditionalProbabilityTable(topModelFN); leafModel = new ConditionalProbabilityTable(leafModelFN); unaryModel = new ConditionalProbabilityTable(unaryModelFN); binaryModel = new ConditionalProbabilityTable(binaryModelFN); } /** Flag for whether to show scoring breakdown. */ protected boolean debugScore = false; /** Sets the debug score flag, and propagates to component models. */ public void setDebug(boolean debugScore) { this.debugScore = debugScore; topModel.setDebug(debugScore); leafModel.setDebug(debugScore); unaryModel.setDebug(debugScore); binaryModel.setDebug(debugScore); } /** The alphabet. */ protected Alphabet alphabet = null; /** Generative logprob feature. */ protected Alphabet.Feature genlogprobFeature = null; /** Sets the alphabet. */ public void setAlphabet(Alphabet alphabet) { this.alphabet = alphabet; List keys = new ArrayList(1); keys.add(genlogprobkey); genlogprobFeature = alphabet.closed() ? alphabet.index(keys) : alphabet.add(keys); } /** Returns the features for the given sign and completeness flag. */ public FeatureVector extractFeatures(Sign sign, boolean complete) { return genLogProbVector((float) logprob(sign, complete)); } /** Returns a feature vector with the given gen log prob. */ protected FeatureVector genLogProbVector(float logprob) { FeatureList retval = new FeatureList(1); if (genlogprobFeature != null) retval.add(genlogprobFeature, logprob); return retval; } /** Derivation handler for getting the log prob for each derivation step as a sum. 
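 * (Per-sign totals are cached via GenLogProb through checkCache/cache, so a sub-derivation
 * that is reached more than once is scored only once.)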
*/ public class LogProbGetter extends DerivationHandler { // reusable list of pairs private List> pairs = new ArrayList>(); private String listPairs() { StringBuffer sb = new StringBuffer(); for (Pair pair : pairs) sb.append(pair.a).append('-').append(pair.b).append(' '); return sb.toString(); } /** Checks for cached value. */ public Double checkCache(Sign sign) { GenLogProb glp = (GenLogProb) sign.getData(GenLogProb.class); return (glp == null) ? null : glp.logprob; } /** Caches the total. */ public void cache(Sign sign, Double total) { sign.addData(new GenLogProb(total)); } /** Top step. */ public Double topStep(Sign sign) { pairs.clear(); addTopFactors(sign, pairs); if (debugScore) System.out.println("[topStep] " + listPairs()); return topModel.logprob(pairs) + handleDerivation(sign); } /** Lexical step. */ public Double lexStep(Sign sign) { pairs.clear(); addLexFactors(sign, pairs); if (debugScore) System.out.println("[lexStep] " + listPairs()); return leafModel.logprob(pairs); } /** Unary step. */ public Double unaryStep(Sign sign, Sign headChild) { pairs.clear(); addUnaryFactors(sign, pairs, headChild); if (debugScore) System.out.println("[unaryStep] " + listPairs()); return unaryModel.logprob(pairs) + handleDerivation(headChild); } /** Binary step. */ public Double binaryStep(Sign sign, boolean left, Sign headChild, Sign siblingChild) { pairs.clear(); addBinaryFactors(sign, pairs, left, headChild, siblingChild); if (debugScore) System.out.println("[binaryStep] " + listPairs()); return binaryModel.logprob(pairs) + handleDerivation(headChild) + handleDerivation(siblingChild); } } /** Derivation handler for getting the factors for each derivation step as a list of words. */ public static class FactorsGetter extends DerivationHandler { /** The factors. */ public List factors = new ArrayList(); // reusable list of pairs private List> pairs = null; // new pairs private void newPairs() { pairs = new ArrayList>(); } // adds new word for pairs to result private void addPairs() { factors.add(new ListPairWord(pairs)); } /** Top step. */ public Void topStep(Sign sign) { newPairs(); addTopFactors(sign, pairs); addPairs(); handleDerivation(sign); return null; } /** Lexical step. */ public Void lexStep(Sign sign) { newPairs(); addLexFactors(sign, pairs); addPairs(); return null; } /** Unary step. */ public Void unaryStep(Sign sign, Sign headChild) { newPairs(); addUnaryFactors(sign, pairs, headChild); addPairs(); handleDerivation(headChild); return null; } /** Binary step. */ public Void binaryStep(Sign sign, boolean left, Sign headChild, Sign siblingChild) { newPairs(); addBinaryFactors(sign, pairs, left, headChild, siblingChild); addPairs(); handleDerivation(headChild); handleDerivation(siblingChild); return null; } } /** Returns the probability of the derivation according to the models. */ public double score(Sign sign, boolean complete) { return NgramScorer.convertToProb(logprob(sign, complete)); } /** Returns the log probability of the derivation according to the models. */ public double logprob(Sign sign, boolean complete) { LogProbGetter lpgetter = new LogProbGetter(); if (complete) return lpgetter.handleCompleteDerivation(sign); else return lpgetter.handleDerivation(sign); } /** Returns the factors from the derivation of the given sign (assumed to be complete). */ public static List getFactors(Sign sign) { FactorsGetter fgetter = new FactorsGetter(); fgetter.handleCompleteDerivation(sign); return fgetter.factors; } /** Adds the factors for the top step in the derivation of the given sign. 
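// ---------------------------------------------------------------------------
// Illustrative sketch, not part of the original source: dumping the factor
// bundles produced by FactorsGetter for a gold derivation, one ListPairWord
// per derivation step. The element type of the returned list is assumed to be
// Word, matching the "list of words" description above.
// ---------------------------------------------------------------------------
import java.util.List;
import opennlp.ccg.lexicon.Word;
import opennlp.ccg.synsem.GenerativeSyntacticModel;
import opennlp.ccg.synsem.Sign;

class FactorDumpSketch {
    static void dumpFactors(Sign goldDerivation) {
        List<Word> factors = GenerativeSyntacticModel.getFactors(goldDerivation);
        for (Word stepFactors : factors)
            System.out.println(stepFactors); // one attribute-value bundle per step
    }
}
// ---------------------------------------------------------------------------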
*/ public static void addTopFactors(Sign sign, List> pairs) { pairs.add(new Pair(EXPANSION, TOP)); pairs.add(new Pair(PARENT, TOP)); pairs.add(new Pair(LEXCAT_PARENT, TOP)); pairs.add(new Pair(WORD_PARENT, TOP)); pairs.add(new Pair(HEAD, sign.getSupertag())); Sign lexHead = sign.getLexHead(); pairs.add(new Pair(LEXCAT_TOP, lexHead.getSupertag())); pairs.add(new Pair(POS_TOP, lexHead.getPOS())); pairs.add(new Pair(WORD_TOP, lexHead.getWordForm())); } /** Adds the factors for a lexical step in the derivation of the given sign. */ public static void addLexFactors(Sign sign, List> pairs) { pairs.add(new Pair(EXPANSION, LEAF)); addParentFactors(sign, pairs); } /** Adds the parent factors for a step in the derivation of the given sign. */ public static void addParentFactors(Sign sign, List> pairs) { pairs.add(new Pair(PARENT, sign.getSupertag())); Sign lexHead = sign.getLexHead(); pairs.add(new Pair(LEXCAT_PARENT, lexHead.getSupertag())); pairs.add(new Pair(POS_PARENT, lexHead.getPOS())); pairs.add(new Pair(WORD_PARENT, lexHead.getWordForm())); } /** Returns the factors for a unary step in the derivation of the given sign. */ public static void addUnaryFactors(Sign sign, List> pairs, Sign headChild) { pairs.add(new Pair(EXPANSION, UNARY)); addParentFactors(sign, pairs); pairs.add(new Pair(HEAD, headChild.getSupertag())); } /** Returns the factors for a binary step in the derivation of the given sign. */ public static void addBinaryFactors(Sign sign, List> pairs, boolean left, Sign headChild, Sign siblingChild) { pairs.add(new Pair(EXPANSION, (left) ? LEFT : RIGHT)); addParentFactors(sign, pairs); pairs.add(new Pair(HEAD, headChild.getSupertag())); pairs.add(new Pair(SIBLING, siblingChild.getSupertag())); Sign siblingLexHead = siblingChild.getLexHead(); pairs.add(new Pair(LEXCAT_SIBLING, siblingLexHead.getSupertag())); pairs.add(new Pair(POS_SIBLING, siblingLexHead.getPOS())); pairs.add(new Pair(WORD_SIBLING, siblingLexHead.getWordForm())); } /** Tests loading and scoring. 
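// ---------------------------------------------------------------------------
// Illustrative sketch, not part of the original source: the attribute-value
// pairs that addBinaryFactors assembles for a right expansion. The category,
// POS, and word values below are invented for illustration, and Pair's type
// parameters are assumed to be <String,String>; a real call would instead use
// addBinaryFactors(sign, pairs, left, headChild, siblingChild).
// ---------------------------------------------------------------------------
import java.util.ArrayList;
import java.util.List;
import opennlp.ccg.util.Pair;
import static opennlp.ccg.synsem.GenerativeSyntacticModel.*;

class BinaryFactorsSketch {
    static List<Pair<String,String>> exampleRightExpansion() {
        List<Pair<String,String>> pairs = new ArrayList<Pair<String,String>>();
        pairs.add(new Pair<String,String>(EXPANSION, RIGHT));          // E: expansion type
        pairs.add(new Pair<String,String>(PARENT, "s\\np"));           // P: parent supertag
        pairs.add(new Pair<String,String>(LEXCAT_PARENT, "s\\np/np")); // CP: parent lex head cat
        pairs.add(new Pair<String,String>(POS_PARENT, "VBD"));         // T: parent head POS
        pairs.add(new Pair<String,String>(WORD_PARENT, "bought"));     // W: parent head word
        pairs.add(new Pair<String,String>(HEAD, "s\\np/np"));          // H: head child supertag
        pairs.add(new Pair<String,String>(SIBLING, "np"));             // S: sibling supertag
        pairs.add(new Pair<String,String>(LEXCAT_SIBLING, "np"));      // CS: sibling lex head cat
        pairs.add(new Pair<String,String>(POS_SIBLING, "NNS"));        // TS: sibling head POS
        pairs.add(new Pair<String,String>(WORD_SIBLING, "shares"));    // WS: sibling head word
        return pairs;
    }
}
// ---------------------------------------------------------------------------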
*/ public static void main(String[] args) throws IOException { String argstr = "(-dir ) (-g ) (-t ) (-verbose)"; String usage = "Usage: java opennlp.ccg.synsem.GenerativeSyntacticModel " + argstr; if (args.length > 0 && args[0].equals("-h")) { System.out.println(usage); System.exit(0); } String dir = ".", topfn = "top.flm", leaffn = "leaf.flm", unaryfn = "unary.flm", binaryfn = "binary.flm"; String grammarfn = "grammar.xml", tbfn = "testbed.xml"; boolean verbose = false; for (int i=0; i < args.length; i++) { if (args[i].equals("-dir")) { dir = args[++i]; continue; } if (args[i].equals("-g")) { grammarfn = args[++i]; continue; } if (args[i].equals("-t")) { tbfn = args[++i]; continue; } if (args[i].equals("-v") || args[i].equals("-verbose")) { verbose = true; continue; } System.out.println("Unrecognized option: " + args[i]); } // load grammar URL grammarURL = new File(grammarfn).toURI().toURL(); System.out.println("Loading grammar from URL: " + grammarURL); Grammar grammar = new Grammar(grammarURL); // load model System.out.println("Loading syntactic model from: " + dir); topfn = dir + "/" + topfn; leaffn = dir + "/" + leaffn; unaryfn = dir + "/" + unaryfn; binaryfn = dir + "/" + binaryfn; GenerativeSyntacticModel model = new GenerativeSyntacticModel(topfn, leaffn, unaryfn, binaryfn); if (verbose) model.setDebug(true); // score saved signs double logprobttotal = 0.0; int numsents = 0; for (File f : Regression.getXMLFiles(new File(tbfn))) { // load testfile System.out.println("Loading: " + f.getName()); RegressionInfo rinfo = new RegressionInfo(grammar, f); // do each item for (int i=0; i < rinfo.numberOfItems(); i++) { TestItem item = rinfo.getItem(i); if (item.numOfParses == 0) continue; numsents++; if (verbose) System.out.println("scoring: " + item.sentence); else System.out.print("."); Sign sign = item.sign; double logprob = model.logprob(sign, true); logprobttotal += logprob; if (verbose) { System.out.println(sign.getDerivationHistory().toString()); System.out.println("logprob: " + logprob); } } System.out.println(); } // totals System.out.println("total logprob: " + logprobttotal); System.out.println("logprob per sentence: " + (logprobttotal / numsents)); } } ================================================ FILE: src/opennlp/ccg/synsem/LF.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-5 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; import opennlp.ccg.unify.*; import org.jdom.*; import gnu.trove.*; /** * An interface for objects which represent Logical Forms. 
* * @author Jason Baldridge * @author Michael White * @version $Revision: 1.10 $, $Date: 2005/11/01 22:35:35 $ */ public interface LF extends Unifiable, Mutable { /** * Sets the LF chunks to which this LF belongs. * LF chunks are used during realization to ensure * that certain edges are semantically complete * before combination is attempted with edges * with semantics outside the chunk. * The chunks are numbered starting with 0, * and null represents no chunks. */ public void setChunks(TIntArrayList chunks); /** * Gets the LF chunks to which this LF belongs. */ public TIntArrayList getChunks(); /** Returns the simple type of this LF, or null if none. */ public SimpleType getType(); /** * Returns a copy of this LF. * (LF chunks are not copied.) */ public LF copy(); /** * Returns a hash code using the given map from vars to ints. */ public int hashCode(TObjectIntHashMap varMap); /** * Returns whether this LF equals the given object * up to variable names, using the given maps from vars to ints. */ public boolean equals(Object obj, TObjectIntHashMap varMap, TObjectIntHashMap varMap2); /** * Returns an XML representation of this LF. */ public Element toXml(); /** * Returns a pretty-printed string of this LF, with the given indent. */ public String prettyPrint(String indent); } ================================================ FILE: src/opennlp/ccg/synsem/LexLogProbFeatureExtractor.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; import java.util.*; import opennlp.ccg.perceptron.*; import opennlp.ccg.lexicon.SupertaggerAdapter; /** * A class for extracting total lexical log probabilities from a supertagger * as a feature. The class may also be used as a sign scorer. * * @author Michael White * @version $Revision: 1.3 $, $Date: 2009/11/01 22:26:29 $ */ public class LexLogProbFeatureExtractor implements FeatureExtractor, SignScorer { /** Feature key. */ public static String lexlogprobkey = "lexlogprob"; /** The alphabet. */ protected Alphabet alphabet = null; /** Lexical logprob feature. */ protected Alphabet.Feature lexlogprobFeature = null; /** Sets the alphabet. */ public void setAlphabet(Alphabet alphabet) { this.alphabet = alphabet; List keys = new ArrayList(1); keys.add(lexlogprobkey); lexlogprobFeature = alphabet.closed() ? alphabet.index(keys) : alphabet.add(keys); } /** Returns the features for the given sign and completeness flag. 
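// ---------------------------------------------------------------------------
// Minimal wiring sketch, not part of the original source: registering the
// extractor's single "lexlogprob" feature with a perceptron Alphabet and then
// pulling a feature vector for a sign. The Alphabet instance is assumed to be
// supplied by the surrounding perceptron model setup.
// ---------------------------------------------------------------------------
import opennlp.ccg.perceptron.Alphabet;
import opennlp.ccg.perceptron.FeatureVector;
import opennlp.ccg.synsem.LexLogProbFeatureExtractor;
import opennlp.ccg.synsem.Sign;

class LexLogProbWiringSketch {
    static FeatureVector lexLogProbFeature(Alphabet alphabet, Sign sign) {
        LexLogProbFeatureExtractor extractor = new LexLogProbFeatureExtractor();
        extractor.setAlphabet(alphabet);              // indexes or adds the "lexlogprob" key
        return extractor.extractFeatures(sign, true); // single-feature vector with the total
    }
}
// ---------------------------------------------------------------------------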
*/ public FeatureVector extractFeatures(Sign sign, boolean complete) { return lexLogProbVector(getLexLogProb(sign, complete)); } /** Recursively gets lex log prob total for the given sign, if not already present. */ protected float getLexLogProb(Sign sign, boolean complete) { // check for stored log prob SupertaggerAdapter.LexLogProb lexlogprob = (SupertaggerAdapter.LexLogProb) sign.getData(SupertaggerAdapter.LexLogProb.class); if (lexlogprob != null) return lexlogprob.logprob; // otherwise calculate and store one float logprob = 0; // lex case if (sign.isLexical()) { // just use zero if not already there } // non-terminal else { // use input totals to calculate current one Sign[] inputs = sign.getDerivationHistory().getInputs(); if (inputs.length == 1) logprob = getLexLogProb(inputs[0], false); else if (inputs.length == 2) logprob = getLexLogProb(inputs[0], false) + getLexLogProb(inputs[1], false); } // store it and return sign.addData(new SupertaggerAdapter.LexLogProb(logprob)); return logprob; } /** Returns a feature vector with the given lex log prob total. */ protected FeatureVector lexLogProbVector(float logprob) { FeatureList retval = new FeatureList(1); if (lexlogprobFeature != null) retval.add(lexlogprobFeature, logprob); return retval; } /** * Returns a score for the given sign and completeness flag; * specifically, returns the lex log prob total for the sign. */ public double score(Sign sign, boolean complete) { return getLexLogProb(sign, complete); } } ================================================ FILE: src/opennlp/ccg/synsem/LexSemOrigin.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2007 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; /** * An interface for items which introduce lexical semantics, covering * (lexical) signs and unary type changing rules. * * @author Michael White * @version $Revision: 1.2 $, $Date: 2008/01/03 21:30:12 $ */ public interface LexSemOrigin { /** * Returns the supertag. */ public String getSupertag(); /** * Returns the POS tag. * For unary type changing rules, the constant TypeChangingRule.POS_STRING is * always returned. */ public String getPOS(); /** * Sets the origin of the elementary predications. 
*/ public void setOrigin(); } ================================================ FILE: src/opennlp/ccg/synsem/Modality.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002 Jason Baldridge // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; import opennlp.ccg.unify.*; /** * A modality that can decorate a categorial slash. * * @author Jason Baldridge * @version $Revision: 1.2 $, $Date: 2004/05/01 10:40:04 $ */ public interface Modality extends Unifiable { public Object copy(); public byte getDirection(); public String toString(byte dir); public String toTeX(byte dir); public String toTeX(); } ================================================ FILE: src/opennlp/ccg/synsem/ReRankingScorer.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2011 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; /** * Interface for signs scorers with both a base model and a full (reranking) model. * The implementation of the score(Sign, boolean) method should vary according to the * full model flag. The base model should be the default. */ public interface ReRankingScorer extends SignScorer { /** Sets flag for using full (vs. base) model. The base model should be the default. 
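// ---------------------------------------------------------------------------
// Minimal sketch, not part of the original source: one way to implement
// ReRankingScorer by delegating to a base SignScorer unless the full
// (reranking) model is switched on. The two component scorers are hypothetical
// and would be supplied by the caller.
// ---------------------------------------------------------------------------
import opennlp.ccg.synsem.ReRankingScorer;
import opennlp.ccg.synsem.Sign;
import opennlp.ccg.synsem.SignScorer;

class SimpleReRankingScorer implements ReRankingScorer {
    private final SignScorer baseModel, fullModel;
    private boolean useFull = false; // base model is the default
    SimpleReRankingScorer(SignScorer baseModel, SignScorer fullModel) {
        this.baseModel = baseModel;
        this.fullModel = fullModel;
    }
    public void setFullModel(boolean on) { useFull = on; }
    public double score(Sign sign, boolean complete) {
        return (useFull ? fullModel : baseModel).score(sign, complete);
    }
}
// ---------------------------------------------------------------------------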
*/ public void setFullModel(boolean on); } ================================================ FILE: src/opennlp/ccg/synsem/SetArg.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-5 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; import opennlp.ccg.unify.*; import org.jdom.*; import java.io.Serializable; import java.util.*; import gnu.trove.*; /** * A category which contains an unordered set of categories. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.11 $, $Date: 2009/12/21 02:15:44 $ */ public final class SetArg implements Arg, Serializable { private static final long serialVersionUID = -7067480310511294657L; private ArgStack _args; @SuppressWarnings("unchecked") public SetArg(Element el) { List info = el.getChildren(); List args = new ArrayList(); for (Iterator infoIt = info.iterator(); infoIt.hasNext();) { Slash s = new Slash(infoIt.next()); Category c = CatReader.getCat(infoIt.next()); args.add(new BasicArg(s, c)); } Arg[] list = new Arg[args.size()]; args.toArray(list); _args = new ArgStack(list); } public SetArg(Arg[] args) { _args = new ArgStack(args); } public SetArg(ArgStack args) { _args = args; } public Element toXml() { Element retval = new Element("setarg"); for (Arg arg : _args._list) { if (arg instanceof BasicArg) { // only supporting basic args per xml construction BasicArg barg = (BasicArg) arg; retval.addContent(barg.getSlash().toXml()); retval.addContent(barg.getCat().toXml()); } } return retval; } public Arg copy() { return new SetArg(_args.copy()); } public void add(ArgStack as) { _args.add(as); } public void forall(CategoryFcn fcn) { _args.forall(fcn); } public Arg copyWithout(int pos) { if (_args.size() == 2) { if (pos == 0) { return _args.get(1); } else { return _args.get(0); } } else { return new SetArg(_args.copyWithout(pos)); } } public int size() { return _args.size(); } public BasicArg get(int pos) { return (BasicArg) _args.get(pos); } public Category getCat(int pos) { return ((BasicArg) _args.get(pos)).getCat(); } public int indexOf(BasicArg a) { int index = -1; for (int i = 0; i < _args.size() && index < 0; i++) { try { a.unifySlash(((BasicArg) _args.get(i)).getSlash()); GUnifier.unify(getCat(i), a.getCat()); index = i; } catch (UnifyFailure uf) { } } // if (index<0) { // throw new UnifyFailure(); // } else { // return index; // } return index; } public int indexOf(Category cat) { int index = -1; for (int i = 0; i < _args.size() && index < 0; i++) { try { GUnifier.unify(getCat(i), cat); index = i; } catch (UnifyFailure uf) { } } return index; // if (index<0) { // throw new 
UnifyFailure(); // } else { // return index; // } } public void setSlashModifier(boolean modifier) { for (int i = 0; i < _args.size(); i++) { BasicArg arg = get(i); arg.setSlashModifier(modifier); } } public void setSlashHarmonicCompositionResult(boolean harmonicResult) { for (int i = 0; i < _args.size(); i++) { BasicArg arg = get(i); arg.setSlashHarmonicCompositionResult(harmonicResult); } } public boolean containsContrarySlash() { for (int i = 0; i < _args.size(); i++) { if (!((BasicArg) _args.get(i)).getSlash().sameDirAsModality()) { return true; } } return false; } public void unifySlash(Slash s) throws UnifyFailure { for (int i = 0; i < _args.size(); i++) { _args.get(i).unifySlash(s); } } public void unifyCheck(Object u) throws UnifyFailure { } // nb: direct unification not implemented ... public Object unify(Object u, Substitution sub) throws UnifyFailure { throw new UnifyFailure(); } public Object fill(Substitution s) throws UnifyFailure { return new SetArg(_args.fill(s)); } public void deepMap(ModFcn mf) { _args.deepMap(mf); } public boolean occurs(Variable v) { return _args.occurs(v); } public boolean equals(Object c) { return false; } public String toString() { StringBuffer sb = new StringBuffer(10); sb.append('{').append(_args.toString()).append('}'); return sb.toString(); } /** * Returns the supertag for this arg. */ public String getSupertag() { StringBuffer sb = new StringBuffer(); sb.append("{").append(_args.getSupertag()).append("}"); return sb.toString(); } /** * Returns a TeX-formatted string representation for this arg. */ public String toTeX() { StringBuffer sb = new StringBuffer(10); sb.append("\\{").append(_args.toTeX()).append("\\}"); return sb.toString(); } /** * Returns a hash code for this arg, using the given map from vars to ints. */ public int hashCode(TObjectIntHashMap varMap) { return _args.hashCode(varMap); } /** * Returns whether this arg equals the given object up to variable names, * using the given maps from vars to ints. */ public boolean equals(Object obj, TObjectIntHashMap varMap, TObjectIntHashMap varMap2) { if (obj.getClass() != this.getClass()) { return false; } SetArg sa = (SetArg) obj; return _args.equals(sa._args, varMap, varMap2); } } ================================================ FILE: src/opennlp/ccg/synsem/Sign.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-9 Jason Baldridge, University of Edinburgh and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; import opennlp.ccg.parse.*; import opennlp.ccg.util.*; import opennlp.ccg.lexicon.*; import opennlp.ccg.grammar.*; import opennlp.ccg.hylo.*; import org.jdom.*; import gnu.trove.*; import java.io.*; import java.util.*; /** * A CCG sign, consisting of a list of words paired with a category. * Signs may contain arbitrary data objects which are ignored in equality checking. * Non-serializable data objects are filtered during serialization. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.44 $, $Date: 2011/08/27 19:27:01 $ */ public class Sign implements LexSemOrigin, Serializable { private static final long serialVersionUID = 1072712272514007274L; /** The words. */ protected List _words; /** The category. */ protected Category _cat; /** The derivation history. */ protected DerivationHistory _history; /** The lexical head. */ protected Sign _lexHead; /** List of transient data objects, for retrieval by class. */ protected LinkedList data = null; /** Constructor for subclasses. */ protected Sign() {} /** Constructor with derivation history. */ @SuppressWarnings("unchecked") protected Sign(List words, Category cat, DerivationHistory dh, Sign lexHead) { _words = (List) Interner.globalIntern(words); _cat = cat; _history = dh; _lexHead = lexHead; } /** Constructor with no additional derivation history. */ public Sign(List words, Category cat) { this(words, cat, null, null); _history = new DerivationHistory(this); _lexHead = this; } /** Constructor with no additional derivation history. */ public Sign(Word word, Category cat) { this(new SingletonList(word), cat); } // during deserialization, interns words @SuppressWarnings("unchecked") private void readObject(java.io.ObjectInputStream in) throws IOException, ClassNotFoundException { in.defaultReadObject(); _words = (List) Interner.globalIntern(_words); } // during serialization, skips non-serializable data objects private void writeObject(java.io.ObjectOutputStream stream) throws IOException { // save old data objects LinkedList tmp = data; // filter non-serializable ones if (tmp != null) { data = new LinkedList(); for (Object obj : tmp) { if (obj instanceof Serializable) data.add(obj); } if (data.isEmpty()) data = null; } // serialize stream.defaultWriteObject(); // restore old data objects data = tmp; } /** Factory method for creating a sign from a lexical sign plus a coarticulation one. 
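// ---------------------------------------------------------------------------
// Illustrative sketch, not part of the original source: because writeObject
// above filters non-Serializable data objects, transient caches attached via
// addData are silently dropped on serialization, while Serializable ones are
// kept. The two wrapper classes here are hypothetical.
// ---------------------------------------------------------------------------
import java.io.Serializable;
import opennlp.ccg.synsem.Sign;

class SignDataSerializationSketch {
    static final class TransientCache { }                       // dropped on write
    static final class PersistentNote implements Serializable { // kept on write
        private static final long serialVersionUID = 1L;
        final String note;
        PersistentNote(String note) { this.note = note; }
    }
    static void attach(Sign sign) {
        sign.addData(new TransientCache());
        sign.addData(new PersistentNote("kept across serialization"));
    }
}
// ---------------------------------------------------------------------------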
*/ public static Sign createCoartSign(Category cat, Sign lexSign, Sign coartSign) { List words = lexSign.getWords(); if (words.size() > 1) throw new RuntimeException("Can't create coarticulation sign from multiple words."); Word word = words.get(0); Word coartWord = coartSign.getWords().get(0); Word wordPlus = Word.createWordWithAttrs(word, coartWord); Sign retval = new Sign(new SingletonList(wordPlus), cat, null, null); retval._lexHead = retval; Rule coartRule = new Rule() { public String name() { return "coart"; } public int arity() { return 1; } public List applyRule(Category[] inputs) { throw new RuntimeException("Not supported."); } public RuleGroup getRuleGroup() { throw new RuntimeException("Not supported."); } public void setRuleGroup(RuleGroup ruleGroup) { throw new RuntimeException("Not supported."); } public Element toXml() { throw new RuntimeException("Not supported."); } }; retval._history = new DerivationHistory(new Sign[]{lexSign,coartSign}, retval, coartRule); return retval; } /** Factory method for creating derived signs with the given cat from the given inputs, rule and lex head. */ public static Sign createDerivedSign(Category cat, Sign[] inputs, Rule rule, Sign lexHead) { return new Sign(cat, inputs, rule, lexHead); } /** Factory method for creating derived signs from the given result cat, inputs, rule and lex head, with a new LF constructed from the inputs. Note that unlike with rule applications, the result LF is constructed with no var substitutions, so it is useful only for creating alternative signs during realization. */ public static Sign createDerivedSignWithNewLF(Category cat, Sign[] inputs, Rule rule, Sign lexHead) { Category copyCat = cat.shallowCopy(); LF lf = null; for (int i = 0; i < inputs.length; i++) { lf = HyloHelper.append(lf, inputs[i].getCategory().getLF()); } if (rule instanceof TypeChangingRule) { TypeChangingRule tcr = (TypeChangingRule) rule; lf = HyloHelper.append(lf, tcr.getResult().getLF()); } if (lf != null) { HyloHelper.sort(lf); } copyCat.setLF(lf); return new Sign(copyCat, inputs, rule, lexHead); } /** Constructor with words and derivation history formed from the given inputs, rule and lex head. */ protected Sign(Category cat, Sign[] inputs, Rule rule, Sign lexHead) { this(getRemainingWords(inputs, 0), cat, null, lexHead); _history = new DerivationHistory(inputs, this, rule); } // returns the remaining words in a structure sharing way private static List getRemainingWords(Sign[] inputs, int index) { // if (inputs.length == 0) throw new RuntimeException("Error: can't make sign from zero inputs"); if (index == (inputs.length - 1)) return inputs[index]._words; return new StructureSharingList( inputs[index]._words, getRemainingWords(inputs, index+1) ); } /** Returns the words of the sign. */ public List getWords() { return _words; } /** Returns the words as a string. Delegates to the current tokenizer's getOrthography method. */ public String getOrthography() { return Grammar.theGrammar.lexicon.tokenizer.getOrthography(_words); } /** Returns the sign's category. */ public Category getCategory() { return _cat; } /** Returns whether the sign is lexical. */ public boolean isLexical() { return _history.isEmpty(); } /** Sets the derivation history. */ public void setDerivationHistory(DerivationHistory dh) { _history = dh; } /** Returns the derivation history. */ public DerivationHistory getDerivationHistory() { return _history; } /** Returns the lexical head. */ public Sign getLexHead() { return _lexHead; } /** Returns a hash code for this sign. 
*/ public int hashCode() { return System.identityHashCode(_words) + _cat.hashCode(); } /** Returns whether this sign equals the given object. */ public boolean equals(Object obj) { if (obj == this) return true; if (!(obj instanceof Sign)) return false; Sign sign = (Sign) obj; return _words == sign._words && _cat.equals(sign._cat); } /** * Returns a hash code for this sign with the words restricted to surface words; * with lexical signs, however, the original hash code is returned, so that * words with signs that differ just in their pos tags can be distinguished * (for robustness). */ public int surfaceWordHashCode() { return surfaceWordHashCode(false); } /** * Returns a hash code for this sign with the words restricted to surface words, * and with the LF ignored according to the given flag; * with lexical signs, however, the original hash code is returned, so that * words with signs that differ just in their pos tags can be distinguished * (for robustness). */ public int surfaceWordHashCode(boolean ignoreLF) { // original hash code for lex signs if (_history.getInputs() == null) return hashCode(); // otherwise use surface words int hc = 1; for (int i = 0; i < _words.size(); i++) { Word word = _words.get(i); hc = 31*hc + word.surfaceWordHashCode(); } hc += (ignoreLF) ? _cat.hashCodeNoLF() : _cat.hashCode(); return hc; } /** * Returns whether this sign and the given object have equal categories and * restrictions to surface words; * with lexical signs, however, the original equals result is returned, so that * words with signs that differ just in their pos tags can be distinguished * (for robustness). */ public boolean surfaceWordEquals(Object obj) { return surfaceWordEquals(obj, false); } /** * Returns whether this sign and the given object have equal categories and * restrictions to surface words, * with the LF ignored according to the given flag; * with lexical signs, however, the original equals result is returned, so that * words with signs that differ just in their pos tags can be distinguished * (for robustness). */ public boolean surfaceWordEquals(Object obj, boolean ignoreLF) { if (obj == this) return true; if (!(obj instanceof Sign)) return false; Sign sign = (Sign) obj; // original equals for lex signs if (_history.getInputs() == null || sign._history.getInputs() == null) return equals(sign); // otherwise use surface words if (_words.size() != sign._words.size()) return false; for (int i = 0; i < _words.size(); i++) { Word word = _words.get(i); Word signWord = (Word) sign._words.get(i); if (!word.surfaceWordEquals(signWord)) return false; } return (ignoreLF) ? _cat.equalsNoLF(sign._cat) : _cat.equals(sign._cat); } /** Returns 'orthography :- category'. */ public String toString() { return getOrthography() + " :- " + _cat.toString(); // for lex head: + " --> " + _lexHead.getWordForm(); } /** * Returns the words in an XML doc, with no labeled spans for nominals. */ public Document getWordsInXml() { Set emptySet = Collections.emptySet(); return getWordsInXml(emptySet); } /** * Returns the words in an XML doc, with labeled spans for the given nominals, * and with pitch accents and boundary tones converted to elements. * Each orthographic word appears in a separate element, * with multiwords grouped under a multiword element. * Attribute-value pairs for the word (if any) appear on the word * or multiword element. * Words are also expanded using the grammar's tokenizer. 
*/ public Document getWordsInXml(Set nominals) { TObjectIntHashMap nominalsMap = new TObjectIntHashMap(); setMaxOrthLengths(nominals, nominalsMap); Document doc = new Document(); Element root = new Element("seg"); doc.setRootElement(root); addWordsToXml(root, nominalsMap); return doc; } // finds the maximum orthography lengths for signs headed by the given nominals private void setMaxOrthLengths(Set nominals, TObjectIntHashMap nominalsMap) { // update map Nominal index = _cat.getIndexNominal(); if (index != null && nominals.contains(index)) { int orthLen = getOrthography().length(); if (!nominalsMap.containsKey(index) || orthLen > nominalsMap.get(index)) { nominalsMap.put(index, orthLen); } } // recurse Sign[] inputs = _history.getInputs(); if (inputs == null) return; for (int i = 0; i < inputs.length; i++) { inputs[i].setMaxOrthLengths(nominals, nominalsMap); } } // recursively adds orthographic words as XML to the given parent, // using the nominals map to determine labeled spans private void addWordsToXml(Element parent, TObjectIntHashMap nominalsMap) { // check for matching nominal as index of target cat; // if found, update parent to labeled span element Nominal index = _cat.getIndexNominal(); if (index != null && nominalsMap.containsKey(index) && nominalsMap.get(index) == getOrthography().length()) { // remove index key from map, to avoid duplicate spans with the same length nominalsMap.remove(index); // make span element, update parent Element span = new Element("span"); span.setAttribute("label", index.toString()); parent.addContent(span); parent = span; } // process inputs from derivation history Sign[] inputs = _history.getInputs(); if (inputs == null) { // in leaf case, word list must be a singleton Word word = _words.get(0); // check for boundary tone if (Grammar.isBoundaryTone(word.getForm())) { // add element for boundary tone Element boundary = new Element("boundary"); boundary.setAttribute("type", word.getForm()); parent.addContent(boundary); return; } // check for pitch accent if (word.getPitchAccent() != null) { // add pitchaccent element containing word(s) with corresponding accent Element pitchaccent = new Element("pitchaccent"); pitchaccent.setAttribute("type", word.getPitchAccent()); addWords(pitchaccent, word); parent.addContent(pitchaccent); return; } // otherwise add word(s) addWords(parent, word); return; } if (inputs.length == 1) { inputs[0].addWordsToXml(parent, nominalsMap); return; } for (int i = 0; i < inputs.length; i++) { inputs[i].addWordsToXml(parent, nominalsMap); } } // adds one or more word elements after expanding surface form; // multiwords are enclosed within a multiword element; // any attribute-value pairs are added to the word or multiword element private void addWords(Element parent, Word word) { List orthWords = Grammar.theGrammar.lexicon.tokenizer.expandWord(word); Element child; if (orthWords.size() == 1) { Element wordElt = new Element("word"); wordElt.addContent(orthWords.get(0)); child = wordElt; } else { Element multiwordElt = new Element("multiword"); for (int i = 0; i < orthWords.size(); i++) { Element wordElt = new Element("word"); wordElt.addContent(orthWords.get(i)); multiwordElt.addContent(wordElt); } child = multiwordElt; } for (Iterator> it = word.getAttrValPairs(); it.hasNext(); ) { Pair p = it.next(); String attr = p.a; String val = p.b; child.setAttribute(attr, val); } parent.addContent(child); } /** * Returns a string showing the bracketings implied by the derivation. 
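// ---------------------------------------------------------------------------
// Minimal usage sketch, not part of the original source: rendering the XML
// word structure for a sign, labeling the span headed by a chosen nominal.
// The set element type is assumed to be Nominal, and JDOM 1.x's XMLOutputter
// is used for serialization, matching the org.jdom imports above.
// ---------------------------------------------------------------------------
import java.util.Collections;
import java.util.Set;
import org.jdom.Document;
import org.jdom.output.XMLOutputter;
import opennlp.ccg.hylo.Nominal;
import opennlp.ccg.synsem.Sign;

class WordsInXmlSketch {
    static String render(Sign sign, Nominal head) {
        Set<Nominal> nominals = Collections.singleton(head); // label this span
        Document doc = sign.getWordsInXml(nominals);
        return new XMLOutputter().outputString(doc);
    }
}
// ---------------------------------------------------------------------------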
* See DerivationHistory.toString to see the complete derivation in * vertical list form. */ public String getBracketedString() { Sign[] inputs = _history.getInputs(); if (inputs == null) return getOrthography(); if (inputs.length == 1) return inputs[0].getBracketedString(); StringBuffer sb = new StringBuffer(); sb.append("("); for (int i = 0; i < inputs.length; i++) { sb.append(inputs[i].getBracketedString()); if (i < (inputs.length - 1)) sb.append(" "); } sb.append(")"); return sb.toString(); } /** * Returns the category's supertag. */ public String getSupertag() { return _cat.getSupertag(); } /** * Returns the word form of the first word. */ public String getWordForm() { return _words.get(0).getForm(); } /** * Returns the POS tag of the first word. */ public String getPOS() { return _words.get(0).getPOS(); } /** * Sets the origin of the elementary predications. */ public void setOrigin() { HyloHelper.setOrigin(_cat.getLF(), this); } /** * Returns the index of the first word of the given lex sign in this sign's * list of words, or -1 if the given lex sign is not in this sign's derivation * history. */ public int wordIndex(Sign lexSign) { return wordIndex(lexSign, new int[]{0}); } // returns word index relative to input offset private int wordIndex(Sign lexSign, int[] offset) { if (this == lexSign) return offset[0]; if (isLexical()) { offset[0] += _words.size(); return -1; } Sign[] inputs = _history.getInputs(); for (int i = 0; i < inputs.length; i++) { int retval = inputs[i].wordIndex(lexSign, offset); if (retval >= 0) return retval; } return -1; } /** Adds a data object to the front of the list of data objects. */ public void addData(Object obj) { if (data == null) data = new LinkedList(); data.addFirst(obj); } /** Returns the first data object with the given class, or null if none. */ public Object getData(Class objClass) { if (data == null) return null; for (Object obj : data) { if (obj.getClass() == objClass) return obj; } return null; } /** Unfilled dependencies wrapper, for unique retrieval from data objects. */ public static class UnfilledDeps { public List unfilledDeps; public UnfilledDeps(List unfilledDeps) { this.unfilledDeps = unfilledDeps; } } /** Filled dependencies wrapper, for unique retrieval from data objects. */ public static class FilledDeps { public List filledDeps; public FilledDeps(List filledDeps) { this.filledDeps = filledDeps; } } /** Returns the unfilled dependencies for this sign, with caching. */ public List getUnfilledDeps() { // check cache UnfilledDeps udeps = (UnfilledDeps) getData(UnfilledDeps.class); if (udeps != null) return udeps.unfilledDeps; // lex case: calculate, store and return if (isLexical()) { List unfilledDeps = HyloHelper.getUnfilledLexDeps(_cat.getLF()); addData(new UnfilledDeps(unfilledDeps)); return unfilledDeps; } // otherwise compute filled deps, with unfilled determined as a side effect, and return cached result getFilledDeps(); udeps = (UnfilledDeps) getData(UnfilledDeps.class); return udeps.unfilledDeps; } /** Returns the filled dependencies for this sign, with caching. 
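// ---------------------------------------------------------------------------
// Illustrative sketch, not part of the original source: collecting the filled
// lexical dependencies for a derivation and printing head and dependent word
// forms. LexDependency is assumed to live in opennlp.ccg.hylo with public
// Sign-valued lexHead/lexDep fields, as suggested by getSignHeadedByDep below.
// ---------------------------------------------------------------------------
import java.util.List;
import opennlp.ccg.hylo.LexDependency;
import opennlp.ccg.synsem.Sign;

class FilledDepsSketch {
    static void printDeps(Sign derivation) {
        List<LexDependency> deps = derivation.getFilledDeps(); // cached per sign
        for (LexDependency dep : deps)
            System.out.println(dep.lexHead.getWordForm() + " -> " + dep.lexDep.getWordForm());
    }
}
// ---------------------------------------------------------------------------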
*/ public List getFilledDeps() { // skip lex case if (isLexical()) return Collections.emptyList(); // check cache FilledDeps fdeps = (FilledDeps) getData(FilledDeps.class); if (fdeps != null) return fdeps.filledDeps; // otherwise get unfilled deps from children recursively List unfilledDeps = new ArrayList(5); Sign[] inputs = _history.getInputs(); for (int i = 0; i < inputs.length; i++) { unfilledDeps.addAll(inputs[i].getUnfilledDeps()); } // calculate filled deps List filledDeps = HyloHelper.getFilledLexDeps(unfilledDeps, _cat.getLF()); // store filled and unfilled, returning filled addData(new UnfilledDeps(unfilledDeps)); addData(new FilledDeps(filledDeps)); return filledDeps; } /** * Returns the sibling filled dependencies for this sign by recursively * filtering the filled dependencies from the input signs for those with * the same head. */ public List getSiblingFilledDeps() { List filledDeps = getFilledDeps(); if (filledDeps.isEmpty()) return Collections.emptyList(); List retval = new ArrayList(5); Sign[] inputs = _history.getInputs(); for (int i = 0; i < inputs.length; i++) { inputs[i].addSiblingFilledDeps(retval, filledDeps); } return retval; } // recursively adds sibling filled deps until lex items reached or // sibs with different heads found private void addSiblingFilledDeps(List retval, List filledDeps) { if (isLexical()) return; List candDeps = getFilledDeps(); if (!candDeps.isEmpty()) { List sibs = LexDependency.filterSameHead(candDeps, filledDeps); if (sibs.isEmpty()) return; retval.addAll(sibs); } Sign[] inputs = _history.getInputs(); for (int i = 0; i < inputs.length; i++) { inputs[i].addSiblingFilledDeps(retval, filledDeps); } } /** * Returns the descendant sign headed by the given dependent * by recursing through the input signs as long as the head remains * the same as the given head; otherwise returns null. */ public Sign getSignHeadedByDep(LexDependency lexdep) { // check same head if (!isLexical() && _lexHead == lexdep.lexHead) { Sign[] inputs = _history.getInputs(); for (int i = 0; i < inputs.length; i++) { // check for match if (inputs[i]._lexHead == lexdep.lexDep) return inputs[i]; // found it // otherwise recurse Sign retval = inputs[i].getSignHeadedByDep(lexdep); if (retval != null) return retval; } } // otherwise not found return null; } /** Tests serialization of simple types, including resolution. 
*/ public void debugSerialization() throws IOException, ClassNotFoundException { // test serialization String filename = "tmp.ser"; ObjectOutputStream out = new ObjectOutputStream(new FileOutputStream(filename)); System.out.println("Writing this: " + this); System.out.println(this.getDerivationHistory()); out.writeObject(this); out.close(); ObjectInputStream in = new ObjectInputStream(new FileInputStream(filename)); System.out.print("Reading sign: "); Sign sign = (Sign) in.readObject(); System.out.println(sign); System.out.println(sign.getDerivationHistory()); in.close(); // test identity and equality System.out.println("this == sign?: " + (this == sign)); System.out.println("this.equals(sign)?: " + (this.equals(sign))); } } ================================================ FILE: src/opennlp/ccg/synsem/SignHash.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-5 Jason Baldridge, Gann Bierner and // University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; import gnu.trove.*; import java.util.*; import opennlp.ccg.lexicon.Word; /** * A set of signs, unique up to surface words. * Signs with lower derivational complexity are kept during insertion. * * @author Jason Baldridge * @author Gann Bierner * @author Michael White * @version $Revision: 1.13 $, $Date: 2009/12/21 02:15:44 $ */ public class SignHash extends THashSet { private static final long serialVersionUID = 1L; /** Hashing strategy that uses Sign's surfaceWordHashCode and surfaceWordEquals methods. */ protected static TObjectHashingStrategy surfaceWordHashingStrategy = new TObjectHashingStrategy() { private static final long serialVersionUID = 1L; public int computeHashCode(java.lang.Object o) { return ((Sign)o).surfaceWordHashCode(); } public boolean equals(java.lang.Object o1, java.lang.Object o2) { return ((Sign)o1).surfaceWordEquals((Sign)o2); } }; /** Default constructor. */ public SignHash() { super(surfaceWordHashingStrategy); } /** * Constructor which adds one sign. */ public SignHash(Sign sign) { this(); insert(sign); } /** * Constructor which adds a collection of signs. */ public SignHash(Collection c) { this(); for (Sign s : c) insert(s); } /** * Returns this as a set of signs. */ @SuppressWarnings("unchecked") public Set asSignSet() { return (Set) this; } /** * Adds a sign, keeping the one with lower derivational complexity * if there is an equivalent one there already; returns the old * sign if it was displaced, the new sign if there was no equivalent * old sign, or null if the sign was not actually added. 
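// ---------------------------------------------------------------------------
// Minimal sketch, not part of the original source: SignHash keeps one sign per
// surface-word/category equivalence class, preferring lower derivational
// complexity on insertion; here we simply collect candidate signs and read
// them back in the stable sorted order. Collection/list element types are
// assumed to be Sign.
// ---------------------------------------------------------------------------
import java.util.Collection;
import java.util.List;
import opennlp.ccg.synsem.Sign;
import opennlp.ccg.synsem.SignHash;

class SignHashSketch {
    static List<Sign> dedupe(Collection<Sign> candidates) {
        SignHash hash = new SignHash(candidates); // inserts each, keeping the simpler ones
        return hash.getSignsSorted();             // persistent ordering for output
    }
}
// ---------------------------------------------------------------------------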
*/ public Sign insert(Sign sign) { int pos = index(sign); if (pos >= 0) { Sign oldSign = (Sign) _set[pos]; if (oldSign == sign) return null; if (sign.getDerivationHistory().compareTo(oldSign.getDerivationHistory()) < 0) { _set[pos] = sign; return oldSign; } else return null; } else { add(sign); return sign; } } /** Returns the signs sorted by their words lexicographically. */ public List getSignsSorted() { ArrayList retval = new ArrayList(asSignSet()); Collections.sort(retval, signComparator); return retval; } /** Comparator for signs to provide a persistent ordering. */ public static final Comparator signComparator = new Comparator() { public int compare(Sign sign1, Sign sign2) { return compareTo(sign1, sign2); } }; /** Compares signs by their derivation complexity, lists of words, then (somewhat desperately) cat hash codes. */ public static int compareTo(Sign sign1, Sign sign2) { int cmp = 0; cmp = sign1.getDerivationHistory().compareTo(sign2.getDerivationHistory()); if (cmp != 0) return cmp; List words1 = sign1.getWords(); List words2 = sign2.getWords(); cmp = compareTo(words1, words2); if (cmp != 0) return cmp; // TODO: implement compareTo method on categories int h1 = sign1.getCategory().hashCode(); int h2 = sign2.getCategory().hashCode(); if (h1 < h2) return -1; if (h1 > h2) return 1; return 0; } /** Compares lists of words lexicographically. */ public static int compareTo(List words1, List words2) { int i=0; while (i < words1.size() || i < words2.size()) { if (i == words1.size()) return -1; if (i == words2.size()) return 1; Word w1 = words1.get(i); Word w2 = words2.get(i); int cmp = w1.compareTo(w2); if (cmp != 0) return cmp; i++; } return 0; } } ================================================ FILE: src/opennlp/ccg/synsem/SignScorer.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-4 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; import java.util.Random; /** * Interface for sign scoring models. * * @author Michael White * @version $Revision: 1.2 $, $Date: 2008/11/09 02:59:49 $ */ public interface SignScorer { /** * Returns a score for the given sign and completeness flag, where higher * numbers are better than lower numbers. * When normalized, returns a score between 0 (worst) and 1 (best). */ public double score(Sign sign, boolean complete); /** A scorer that returns 0 for all signs. */ public static SignScorer nullScorer = new SignScorer() { public double score(Sign sign, boolean complete) { return 0; } }; /** A scorer that returns a random number in [0,1] for all signs. 
*/ public static SignScorer randomScorer = new SignScorer() { Random random = new Random(); public double score(Sign sign, boolean complete) { return random.nextDouble(); } }; } ================================================ FILE: src/opennlp/ccg/synsem/Slash.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-7 Jason Baldridge, Gann Bierner and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; import java.io.Serializable; import gnu.trove.*; import org.jdom.Element; import opennlp.ccg.unify.*; /** * A categorial slash which has an optional mode associated with it. * * @author Jason Baldridge * @author Gann Bierner * @author Michael White * @version $Revision: 1.10 $, $Date: 2009/11/28 03:39:27 $ */ public final class Slash implements Unifiable, Mutable, Serializable { private static final long serialVersionUID = -1935688863458012637L; public static final byte L = 0; public static final byte B = 1; public static final byte R = 2; public static final byte INERT_OR_ACTIVE = 0; public static final byte ACTIVE = 1; public static final byte INERT = 2; private final byte _dir; private final Modality _modality; private byte _ability = INERT_OR_ACTIVE; private boolean _modifier = false; private boolean _harmonicCompositionResult = false; public Slash(Element el) { String d = el.getAttributeValue("dir"); if (d == null) d = el.getAttributeValue("d"); if (d == null) { d = "|"; } _dir = encode(d.charAt(0)); String m = el.getAttributeValue("mode"); if (m == null) m = el.getAttributeValue("m"); if (m != null) { _modality = new SlashMode(m); } else { String vm = el.getAttributeValue("varmodality"); if (vm == null) vm = el.getAttributeValue("varModality"); if (vm != null) { _modality = new VarModality(vm); } else { _modality = new SlashMode(); } } String ability = el.getAttributeValue("ability"); if (null != ability) { setAbility(ability); } } public Slash() { this('|'); } public Slash(char sd) { _dir = encode(sd); _modality = new SlashMode(); } public Slash(char sd, String md) { _dir = encode(sd); _modality = new SlashMode(md); } public Slash(char sd, Modality md) { _dir = encode(sd); _modality = md; } private Slash(byte d, Modality m, byte a) { _dir = d; _modality = m; _ability = a; } public Element toXml() { Element retval = new Element("slash"); retval.setAttribute("dir", encode()); String ability = decodeAbility(); if (_modality instanceof SlashMode) { String mode = _modality.toString(); if (!mode.equals(".")) retval.setAttribute("mode", mode); } else if (_modality instanceof VarModality) retval.setAttribute("varmodality", ((VarModality) _modality).name()); if (ability != null) 
retval.setAttribute("ability", ability); return retval; } public Slash copy() { Slash retval = new Slash(_dir, (Modality) _modality.copy(), _ability); retval._modifier = _modifier; retval._harmonicCompositionResult = _harmonicCompositionResult; return retval; } public boolean occurs(Variable v) { return _modality.occurs(v); } public void deepMap(ModFcn mf) { mf.modify(this); } public boolean isActive() { return _ability == ACTIVE || _ability == INERT_OR_ACTIVE; } public boolean setAbility(String ability) { byte newAbility; if (ability.equals("inert")) { newAbility = INERT; } else if (ability.equals("active")) { newAbility = ACTIVE; } else { newAbility = INERT_OR_ACTIVE; } if (abilitiesMatch(_ability, newAbility)) { _ability = newAbility; return true; } else { return false; } } /** Returns a string for the ability or null if not set. */ public String decodeAbility() { if (_ability == INERT) return "inert"; else if (_ability == ACTIVE) return "active"; else return null; } /** Returns whether this cat is a modifier cat (defaults to false). */ public boolean isModifier() { return _modifier; } /** Sets whether this cat is a modifier cat. */ // NB: Might want to change this allow lex overrides of defaults public void setModifier(boolean modifier) { _modifier = modifier; } /** Returns whether this arg has resulted from harmonic composition. */ public boolean isHarmonicCompositionResult() { return _harmonicCompositionResult; } /** Sets whether this arg has resulted from harmonic composition. */ public void setHarmonicCompositionResult(boolean harmonicResult) { _harmonicCompositionResult = harmonicResult; } public void unifyCheck(Object u) throws UnifyFailure { if (u instanceof Slash) { if (!abilitiesMatch(_ability, ((Slash) u)._ability)) { throw new UnifyFailure(); } if (!directionsMatch(_dir, ((Slash) u)._dir)) { throw new UnifyFailure(); } _modality.unifyCheck(((Slash) u)._modality); } else { throw new UnifyFailure(); } } public Object unify(Object u, Substitution sub) throws UnifyFailure { if (u instanceof Slash) { Slash s2 = (Slash) u; byte newAbility = _ability; if (_ability == INERT_OR_ACTIVE) { newAbility = s2._ability; } else if (s2._ability == INERT_OR_ACTIVE) { newAbility = _ability; } else if (_ability != s2._ability) { throw new UnifyFailure(); } byte newDir = _dir; if (_dir == B) { newDir = s2._dir; } else if (s2._dir == B) { newDir = _dir; } else if (_dir != s2._dir) { throw new UnifyFailure(); } Modality newModality = (Modality) _modality.unify(((Slash) u)._modality, sub); Slash retval = new Slash(newDir, newModality, newAbility); retval._modifier = _modifier; return retval; } else { throw new UnifyFailure(); } } public Object fill(Substitution sub) throws UnifyFailure { Slash retval = new Slash(_dir, (Modality) _modality.fill(sub), _ability); retval._modifier = _modifier; return retval; } // public boolean equals(Slash s) { // return directionsMatch(_dir, s._dir); // } public boolean sameDirAsModality() { return directionsMatch(_dir, _modality.getDirection()); } private static byte encode(char sd) { switch (sd) { case '/': return R; case '\\': return L; default: return B; } } public static boolean directionsMatch(byte s1, byte s2) { if (s1 == B || s2 == B) { return true; } else { return s1 == s2; } } private static boolean abilitiesMatch(byte ab1, byte ab2) { if (ab1 == INERT_OR_ACTIVE || ab2 == INERT_OR_ACTIVE) { return true; } else { return ab1 == ab2; } } /** * Returns a hash code based on the direction, ability and modality. 
*/ public int hashCode() { return 31 * _dir + 7 * _ability + _modality.hashCode(); } /** * Returns whether this slash equals the given object * based on the direction, ability and modality. */ public boolean equals(Object obj) { if (this == obj) return true; if (obj.getClass() != this.getClass()) return false; Slash s = (Slash) obj; if (_dir != s._dir ||_ability != s._ability) return false; return _modality.equals(s._modality); } /** * Returns a hash code using the given map from vars to ints. */ public int hashCode(TObjectIntHashMap varMap) { int retval = 31 * _dir + 7 * _ability; if (_modality instanceof Variable) retval += ((Variable)_modality).hashCode(varMap); else retval += _modality.hashCode(); return retval; } /** * Returns whether this slash equals the given object up to variable names, * using the given maps from vars to ints. */ public boolean equals(Object obj, TObjectIntHashMap varMap, TObjectIntHashMap varMap2) { if (this == obj) return true; if (obj.getClass() != this.getClass()) return false; Slash s = (Slash) obj; if (_dir != s._dir || _ability != s._ability) return false; if (_modality instanceof Variable) return ((Variable)_modality).equals(s._modality, varMap, varMap2); else return _modality.equals(s._modality); } // string for showing ability private String abilityStr() { if (_ability == ACTIVE) return "@"; else if (_ability == INERT) return "!"; else return ""; } public String toString() { switch (_dir) { case R: return "/" + abilityStr() + _modality.toString(R); case L: return "\\" + abilityStr() + _modality.toString(L); default: return "|" + abilityStr() + _modality; } } /** * Returns the direction for this slash as a string. */ public String encode() { switch (_dir) { case R: return "/"; case L: return "\\"; default: return "|"; } } /** * Returns the supertag for this slash. */ public String getSupertag() { return encode(); } /** * Returns a TeX-formatted string representation for this slash. */ public String toTeX() { StringBuffer sb = new StringBuffer(); String sup = "\\sups"; String sub = "\\subs"; String modTeX = null; switch (_dir) { case R: sb.append("/ "); sup = "\\supsb"; sub = "\\subsa"; modTeX = _modality.toTeX(R); break; case L: sb.append("\\bs "); sub = "\\subsb"; sup = "\\supsa"; modTeX = _modality.toTeX(L); break; default: sb.append("| "); sub = "\\subs"; sup = "\\sups"; modTeX = _modality.toTeX(); break; } if (_ability == ACTIVE) sb.append(sup).append("{").append("+").append("} "); if (_ability == INERT) sb.append(sup).append("{").append("-").append("} "); if ((modTeX != "") && (_ability == ACTIVE)) { if ((_dir == R)) sb.append("\\hspace{-1.45mm} "); else if (_dir == L) sb.append("\\hspace{-0.50mm} "); } if (modTeX != "") sb.append(sub).append("{").append(modTeX).append("} "); return sb.toString(); } } ================================================ FILE: src/opennlp/ccg/synsem/SlashMode.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002 Jason Baldridge // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. 
See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; import java.io.Serializable; import org.jdom.Element; import opennlp.ccg.unify.*; /** * A mode that can decorate a categorial slash. * * @author Jason Baldridge * @version $Revision: 1.5 $, $Date: 2009/07/17 04:23:30 $ */ public final class SlashMode implements Modality, Serializable { private static final long serialVersionUID = -2387797559890373347L; public static final byte All = 0; public static final byte ApplicationOnly = 1; public static final byte Associative = 2; public static final byte Permutative = 3; public static final byte PermutativeRight = 4; public static final byte PermutativeLeft = 5; public static final byte APRight = 6; public static final byte APLeft = 7; private byte _mode; public SlashMode(Element el) { String m = el.getAttributeValue("mode"); if (m == null) m = el.getAttributeValue("m"); if (m == null) { m = "."; } _mode = byteVal(m); } public SlashMode() { this("."); } public SlashMode(String m) { _mode = byteVal(m); } private SlashMode(byte m) { _mode = m; } public Object copy() { return new SlashMode(_mode); } /** Returns a hash code based on the mode. */ public int hashCode() { return 31 * _mode; } /** Returns whether this slash mode equals the given object based on the mode. */ public boolean equals(Object obj) { if (this == obj) return true; if (obj.getClass() != this.getClass()) return false; SlashMode m = (SlashMode) obj; return _mode == m._mode; } // public boolean equals(SlashMode m) { // return _mode == m._mode; // } public boolean occurs(Variable var) { return false; } public void unifyCheck(Object o) throws UnifyFailure { if (!(o instanceof VarModality || (o instanceof SlashMode && modesMatch( _mode, ((SlashMode) o)._mode)))) { throw new UnifyFailure(); } } public Object unify(Object o, Substitution sub) throws UnifyFailure { if (o instanceof VarModality) { return ((VarModality) o).unify(this, sub); } else if (o instanceof SlashMode) { if (modesMatch(_mode, ((SlashMode) o)._mode)) { return copy(); } else { throw new UnifyFailure(); } } else { throw new UnifyFailure(); } } public Object fill(Substitution sub) throws UnifyFailure { return copy(); } public String toString(byte slashDir) { if (slashDir == getDirection()) { switch (_mode) { case PermutativeRight: return "x"; case PermutativeLeft: return "x"; case APRight: return ""; case APLeft: return ""; default: return toString(); } } else { return toString(); } } public String toString() { switch (_mode) { case All: return "."; case ApplicationOnly: return "*"; case Associative: return "^"; case Permutative: return "x"; case PermutativeRight: return "x>"; case PermutativeLeft: return "<x"; case APRight: return ">"; case APLeft: return "<"; default: return "."; } } public String toTeX(byte slashDir) { if (slashDir == getDirection()) { switch (_mode) { case PermutativeRight: return "x"; case PermutativeLeft: return "x"; case APRight: return ""; case APLeft: return ""; default: return toTeX(); } } else { return toTeX(); } } public String toTeX() { switch (_mode) { case All: return "."; case ApplicationOnly: return "*"; case Associative: return "\\diamond"; case Permutative: return "x"; case PermutativeRight: return "x>"; case PermutativeLeft: return
""; case APLeft: return "<"; default: return "."; } } private static byte byteVal(String m) { if (m.equals(".")) { return All; } else if (m.equals(">")) { return APRight; } else if (m.equals("<")) { return APLeft; } else if (m.equals("*")) { return ApplicationOnly; } else if (m.equals("^")) { return Associative; } else if (m.equals("x")) { return Permutative; } else if (m.equals("x>")) { return PermutativeRight; } else if (m.equals(" " + doMatch); return doMatch; } } ================================================ FILE: src/opennlp/ccg/synsem/SyntacticFeatureExtractor.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2009 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; import java.util.*; import opennlp.ccg.perceptron.*; import opennlp.ccg.util.TrieMap; import opennlp.ccg.lexicon.Word; /** * A class for extracting generic features from derivations, * inspired by those in the C&C-07 normal form model. * * Features are extracted lazily for efficiency. * * @author Michael White * @version $Revision: 1.10 $, $Date: 2011/11/08 14:58:15 $ */ public class SyntacticFeatureExtractor implements FeatureExtractor { /** Feature prefix constant: "syn". */ public static final String PREFIX = "syn"; /** Feature map wrapper, for unique retrieval from a sign's data objects. */ public static class FeatureMapWrapper { public FeatureMap featureMap; public FeatureMapWrapper(FeatureMap featureMap) { this.featureMap = featureMap; } } /** Flag for whether to include distance features (defaults to true). */ public boolean includeDistFeats = true; /** The alphabet. */ protected Alphabet alphabet = null; /** Current feature map. */ protected FeatureMap currentMap = null; /** Current sign (for extracting features). */ protected Sign currentSign = null; /** Current input signs (for extracting features). */ protected Sign[] currentInputs = null; /** Current sibling (for extracting features). */ protected Sign currentSibling = null; /** Current words (for extracting features). */ protected List currentWords = null; /** Current head index (for extracting features). */ protected int currentHeadIndex = -1; /** Current sibling head index (for extracting features). */ protected int currentSibHeadIndex = -1; /** Current distance in words (for extracting features). */ protected String currentDistW = null; /** Current distance in puncts (for extracting features). */ protected String currentDistP = null; /** Current distance in verbs (for extracting features). */ protected String currentDistV = null; /** Lexical feature extractors. */ protected List>> lexExtractors = new ArrayList>>(); /** Rule feature extractors. 
*/ protected List>> unaryRuleExtractors = new ArrayList>>(); /** Binary rule feature extractors. */ protected List>> binaryRuleExtractors = new ArrayList>>(); /** Distance feature extractors. */ protected List>> distExtractors = new ArrayList>>(); /** Constructor. */ public SyntacticFeatureExtractor() { // init lazy feature extractors lexExtractors.add(lexcat_word()); lexExtractors.add(lexcat_pos()); unaryRuleExtractors.add(unary_rule()); unaryRuleExtractors.add(unary_rule_word()); unaryRuleExtractors.add(unary_rule_pos()); binaryRuleExtractors.add(binary_rule()); binaryRuleExtractors.add(binary_rule_word()); binaryRuleExtractors.add(binary_rule_pos()); binaryRuleExtractors.add(rule_word_word()); binaryRuleExtractors.add(rule_word_pos()); binaryRuleExtractors.add(rule_pos_word()); binaryRuleExtractors.add(rule_pos_pos()); distExtractors.add(rule_word_dist()); distExtractors.add(rule_pos_dist()); distExtractors.add(rule_word_dist_puncts()); distExtractors.add(rule_pos_dist_puncts()); distExtractors.add(rule_word_dist_verbs()); distExtractors.add(rule_pos_dist_verbs()); } /** Sets the alphabet. */ public void setAlphabet(Alphabet alphabet) { this.alphabet = alphabet; } /** Returns the features for the given sign and completeness flag. */ public FeatureVector extractFeatures(Sign sign, boolean complete) { addFeatures(sign, complete); return getFeatureMap(sign); } /** Recursively adds features to the feature map for the given sign, if not already present. */ protected void addFeatures(Sign sign, boolean complete) { // check for existing map, otherwise make one if (getFeatureMap(sign) != null) return; // lex case if (sign.isLexical()) { currentSign = sign; currentMap = new FeatureMap(); inc(lexExtractors); } // non-terminal else { Sign[] inputs = sign.getDerivationHistory().getInputs(); // first recurse for (Sign child : inputs) addFeatures(child, false); // use input maps in making current map currentSign = sign; currentInputs = inputs; if (inputs.length == 1) { currentMap = new FeatureMap(getFeatureMap(inputs[0])); inc(unaryRuleExtractors); } else if (inputs.length == 2) { currentMap = new FeatureMap(getFeatureMap(inputs[0]), getFeatureMap(inputs[1])); currentSibling = sibling(sign, inputs); inc(binaryRuleExtractors); // dist feats if (includeDistFeats) { currentWords = null; // get words and head indices lazily currentDistW = null; currentDistP = null; currentDistV = null; // also reset current distances inc(distExtractors); } } } // store it storeFeatureMap(sign); } /** Stores the current feature map as a data object in the given sign. */ protected void storeFeatureMap(Sign sign) { sign.addData(new FeatureMapWrapper(currentMap)); } /** Returns the feature map for this extractor from the given sign (null if none). */ protected FeatureMap getFeatureMap(Sign sign) { FeatureMapWrapper fmw = (FeatureMapWrapper)sign.getData(FeatureMapWrapper.class); return (fmw != null) ? fmw.featureMap : null; } /** * Increments the count of the given features, if relevant. */ protected void inc(List>> extractors) { for (List> lazyExtractor : extractors) { Alphabet.Feature f = alphabet.indexLazy(lazyExtractor); if (f != null) currentMap.inc(f); } } /** Returns the sibling sign from among the two inputs. */ protected Sign sibling(Sign sign, Sign[] inputs) { if (sign.getLexHead() == inputs[0].getLexHead()) return inputs[1]; else return inputs[0]; } /** Sets the current words, if null, along with head indices. 
*/ protected void setCurrentWords() { if (currentWords != null) return; currentWords = currentSign.getWords(); Word head = currentSign.getLexHead().getWords().get(0); Word sibHead = currentSibling.getLexHead().getWords().get(0); currentHeadIndex = find(currentWords, head); currentSibHeadIndex = find(currentWords, sibHead); } /** Returns the index of the given word in the list, or -1 if not found. */ protected int find(List words, Word word) { int len = words.size(); for (int i=0; i < len; i++) { if (words.get(i) == word) return i; } return -1; } /** Returns the distance in intervening words as 0w, 1w, 2w or 3w (for 3 or more). */ protected String distWords() { if (currentDistW != null) return currentDistW; setCurrentWords(); int dist = Math.abs(currentHeadIndex - currentSibHeadIndex) - 1; switch (dist) { case 0: return currentDistW = "0w"; case 1: return currentDistW = "1w"; case 2: return currentDistW = "2w"; default: return currentDistW = "3w"; } } /** Returns the distance in intervening punctuation marks as 0p, 1p, 2p or 3p (for 3 or more). */ protected String distPuncts() { if (currentDistP != null) return currentDistP; setCurrentWords(); int min = Math.min(currentHeadIndex, currentSibHeadIndex); int max = Math.max(currentHeadIndex, currentSibHeadIndex); int count = 0; for (int i=min+1; i < max; i++) { Word w = currentWords.get(i); if (isPunct(w)) count++; } switch (count) { case 0: return currentDistP = "0p"; case 1: return currentDistP = "1p"; case 2: return currentDistP = "2p"; default: return currentDistP = "3p"; } } /** * Returns whether a word is a punctuation mark that typically signals sentence-internal complexity. * The default implementation tests for commas, dashes (--), semi-colons and colons. */ protected boolean isPunct(Word word) { // NB: in principle could use POS, but sometimes punctuation marks seem to end up with IN as the POS tag String form = word.getForm(); return (form == "," || form == "--" || form == ";" || form == ":"); } /** Returns the distance in intervening verbs as 0v, 1v, or 2v (for 2 or more). */ protected String distVerbs() { if (currentDistV != null) return currentDistV; setCurrentWords(); int min = Math.min(currentHeadIndex, currentSibHeadIndex); int max = Math.max(currentHeadIndex, currentSibHeadIndex); int count = 0; for (int i=min+1; i < max; i++) { Word w = currentWords.get(i); if (isVerb(w)) count++; } switch (count) { case 0: return currentDistV = "0v"; case 1: return currentDistV = "1v"; default: return currentDistV = "2v"; } } /** * Returns whether a word is a verb. * The default implementation tests for a POS tag beginning with V. 
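* Like isPunct, this can be overridden in a subclass to suit a different tagset;
* for instance, a hypothetical extractor that also counts modals as verbs might
* look like this (sketch only, assuming an MD tag for modals):
* <pre>
* public class MyTagsetFeatureExtractor extends SyntacticFeatureExtractor {
*     protected boolean isVerb(Word word) {
*         String pos = word.getPOS();
*         return pos.startsWith("V") || pos.equals("MD");
*     }
* }
* </pre>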
*/ protected boolean isVerb(Word word) { String pos = word.getPOS(); return (pos.startsWith("V")); } // lex cat + word private List> lexcat_word() { List> retval = new ArrayList>(2); add_supertag(retval); retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return currentSign.getWordForm(); }}); return retval; } // add prefix + supertag private void add_supertag(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return PREFIX; }}); retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return currentSign.getSupertag(); }}); } // lex cat + pos private List> lexcat_pos() { List> retval = new ArrayList>(2); add_supertag(retval); retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return currentSign.getPOS(); }}); return retval; } // rule private List> unary_rule() { List> retval = new ArrayList>(2); add_unary_rule(retval); return retval; } private void add_unary_rule(List> retval) { add_supertag(retval); retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return currentInputs[0].getSupertag(); }}); } private List> binary_rule() { List> retval = new ArrayList>(3); add_binary_rule(retval); return retval; } private void add_binary_rule(List> retval) { add_unary_rule(retval); retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return currentInputs[1].getSupertag(); }}); } // rule + head word private List> unary_rule_word() { List> retval = new ArrayList>(3); add_unary_rule_word(retval); return retval; } private void add_unary_rule_word(List> retval) { add_unary_rule(retval); add_lex_word(retval); } private void add_lex_word(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return currentSign.getLexHead().getWordForm(); }}); } private List> binary_rule_word() { List> retval = new ArrayList>(4); add_binary_rule_word(retval); return retval; } private void add_binary_rule_word(List> retval) { add_binary_rule(retval); add_lex_word(retval); } // rule + head pos private List> unary_rule_pos() { List> retval = new ArrayList>(3); add_unary_rule_pos(retval); return retval; } private void add_unary_rule_pos(List> retval) { add_unary_rule(retval); add_lex_pos(retval); } private void add_lex_pos(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return currentSign.getLexHead().getPOS(); }}); } private List> binary_rule_pos() { List> retval = new ArrayList>(4); add_binary_rule_pos(retval); return retval; } private void add_binary_rule_pos(List> retval) { add_binary_rule(retval); add_lex_pos(retval); } // rule + head word + sibling word private List> rule_word_word() { List> retval = new ArrayList>(5); add_binary_rule_word(retval); add_sibling_word(retval); return retval; } private void add_sibling_word(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return currentSibling.getLexHead().getWordForm(); }}); } // rule + head word + sibling pos private List> rule_word_pos() { List> retval = new ArrayList>(5); add_binary_rule_word(retval); add_sibling_pos(retval); return retval; } private void add_sibling_pos(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return currentSibling.getLexHead().getPOS(); }}); } // rule + head pos + sibling word private List> rule_pos_word() { List> retval = new ArrayList>(5); add_binary_rule_pos(retval); add_sibling_word(retval); return retval; } // rule + head pos + sibling pos private List> rule_pos_pos() { List> retval = new ArrayList>(5); add_binary_rule_pos(retval); add_sibling_pos(retval); return 
retval; } // rule + head word + dist private List> rule_word_dist() { List> retval = new ArrayList>(5); add_binary_rule_word(retval); add_dist_words(retval); return retval; } private void add_dist_words(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return distWords(); }}); } // rule + head pos + dist private List> rule_pos_dist() { List> retval = new ArrayList>(5); add_binary_rule_pos(retval); add_dist_words(retval); return retval; } // rule + head word + dist in puncts private List> rule_word_dist_puncts() { List> retval = new ArrayList>(5); add_binary_rule_word(retval); add_dist_puncts(retval); return retval; } private void add_dist_puncts(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return distPuncts(); }}); } // rule + head pos + dist in puncts private List> rule_pos_dist_puncts() { List> retval = new ArrayList>(5); add_binary_rule_pos(retval); add_dist_puncts(retval); return retval; } // rule + head word + dist in verbs private List> rule_word_dist_verbs() { List> retval = new ArrayList>(5); add_binary_rule_word(retval); add_dist_verbs(retval); return retval; } private void add_dist_verbs(List> retval) { retval.add(new TrieMap.KeyExtractor(){public String getKey(){ return distVerbs(); }}); } // rule + head pos + dist in verbs private List> rule_pos_dist_verbs() { List> retval = new ArrayList>(5); add_binary_rule_pos(retval); add_dist_verbs(retval); return retval; } } ================================================ FILE: src/opennlp/ccg/synsem/TargetCat.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002 Jason Baldridge // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; /** * A category that can be a target of a curried cat. Basically, atomcats or * variable cats. * * @author Jason Baldridge * @version $Revision: 1.1.1.1 $, $Date: 2003/02/28 18:02:13 $ */ public interface TargetCat extends Category { } ================================================ FILE: src/opennlp/ccg/synsem/VarModality.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-7 Jason Baldridge and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. 
See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.synsem; import java.io.Serializable; import gnu.trove.TObjectIntHashMap; import opennlp.ccg.unify.*; /** * A class for variables which can stand for slash modalities. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.4 $, $Date: 2009/07/17 04:23:30 $ **/ public class VarModality implements Variable, Indexed, Mutable, Modality, Serializable { private static final long serialVersionUID = 7465785777802095802L; protected final String _name; protected int _index; protected int _hashCode; private static int UNIQUE_STAMP = 0; public VarModality() { this("VM"+UNIQUE_STAMP++); } public VarModality(String name) { this(name, 0); } protected VarModality(String name, int index) { _name = name; _index = index; _hashCode = _name.hashCode() + _index; } public String name() { return _name; } public Object copy() { return new VarModality(_name, _index); } public void deepMap(ModFcn mf) { mf.modify(this); } public int getIndex() { return _index; } public void setIndex(int index) { _hashCode += index - _index; _index = index; } public boolean occurs(Variable var) { return equals(var); } public int hashCode() { return _hashCode; } public boolean equals(Object o) { if (this == o) return true; if (!(o instanceof VarModality)) return false; VarModality vm = (VarModality) o; return _index == vm._index && _name.equals(vm._name); } /** * Returns a hash code using the given map from vars to ints. */ public int hashCode(TObjectIntHashMap varMap) { // see if this already in map if (varMap.containsKey(this)) return varMap.get(this); // otherwise add it int next = varMap.size() + 1; varMap.put(this, next); return next; } /** * Returns whether this var equals the given object up to variable names, * using the given maps from vars to ints. 
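* For instance, two variables with different names count as equal here as long as
* they have been assigned the same index in their respective maps (sketch):
* <pre>
* VarModality m1 = new VarModality("M1");
* VarModality m2 = new VarModality("M2");
* TObjectIntHashMap map1 = new TObjectIntHashMap();
* TObjectIntHashMap map2 = new TObjectIntHashMap();
* m1.hashCode(map1); // assigns m1 the next free index (1) in map1
* m2.hashCode(map2); // likewise assigns m2 index 1 in map2
* boolean equalUpToNames = m1.equals(m2, map1, map2); // true
* </pre>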
*/ public boolean equals(Object obj, TObjectIntHashMap varMap, TObjectIntHashMap varMap2) { if (this == obj) return true; if (obj.getClass() != this.getClass()) { return false; } VarModality vm = (VarModality) obj; if (varMap.get(this) != varMap2.get(vm)) return false; return true; } public void unifyCheck(Object o) throws UnifyFailure { if (!(o instanceof SlashMode || o instanceof VarModality)) { throw new UnifyFailure(); } } public Object unify(Object u, Substitution sub) throws UnifyFailure { if (u instanceof SlashMode) { return sub.makeSubstitution(this, u); } else if (u instanceof VarModality) { VarModality var2 = (VarModality)u; Variable $var = new VarModality(_name+var2._name, UnifyControl.getUniqueVarIndex()); sub.makeSubstitution(this, $var); sub.makeSubstitution(var2, $var); return $var; } else { throw new UnifyFailure(); } } public Object fill(Substitution sub) throws UnifyFailure { Object val = sub.getValue(this); if (val != null) { return val; } else { return this; } } public byte getDirection() { return Slash.B; } public String toString(byte dir) { return toString(); } public String toString() { return _name; } public String toTeX(byte dir) { return toTeX(); } public String toTeX() { return _name; } } ================================================ FILE: src/opennlp/ccg/test/CrossValidateRealizer.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.test; import opennlp.ccg.grammar.*; import opennlp.ccg.realize.*; import opennlp.ccg.synsem.SignScorer; import opennlp.ccg.ngrams.*; import java.io.*; import java.net.*; import java.util.*; //import java.util.prefs.*; //import java.text.NumberFormat; import org.jdom.*; import org.jdom.input.*; /** * Runs cross-validation tests with the realizer. * * @author Michael White * @version $Revision: 1.30 $, $Date: 2011/03/20 20:11:58 $ */ public class CrossValidateRealizer implements ScorerMaker { /** The tester to use. */ public Regression tester = null; /** The path to the tmp dir. */ public String tmpdir = "tmp"; // the actual tmp dir private File tmpDir = null; /** The number of cross-validation folds, either 1.x or an int of at least 2. */ public double numFolds = 10; /** The scorer maker, for preparing and loading scoring models. */ public ScorerMaker scorerMaker = this; /** The pruning strategy, if any. */ public PruningStrategy pruningStrategy = null; /** Sets up the tester with the given grammar. 
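* A programmatic run mirrors the command-line routine in main: construct the
* cross-validator from a grammar URL, set up the folds, prepare the scorers,
* then run the test (sketch; the file names are just main's defaults):
* <pre>
* URL grammarURL = new File("grammar.xml").toURI().toURL();
* URL testbedURL = new File("testbed.xml").toURI().toURL();
* CrossValidateRealizer cvr = new CrossValidateRealizer(grammarURL);
* cvr.numFolds = 10; // the default
* cvr.setupInputs(testbedURL);
* cvr.prepScorers();
* cvr.runTest();
* </pre>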
*/ public CrossValidateRealizer(URL grammarURL) throws IOException { // init tester tester = new Regression(); // load grammar System.out.println("Loading grammar from URL: " + grammarURL); tester.grammar = new Grammar(grammarURL); System.out.println(); } /** Sets up the folds in tmpdir. */ @SuppressWarnings({ "unchecked", "rawtypes" }) public void setupInputs(URL testbedURL) throws IOException { // ensure tmpdir exists tmpDir = new File(tmpdir); if (!tmpDir.exists()) { tmpDir.mkdirs(); } try { // load items System.out.println("Loading testbed from URL: " + testbedURL); SAXBuilder builder = new SAXBuilder(); Document inputDoc = builder.build(testbedURL.openStream()); System.out.println(); Element inputRoot = inputDoc.getRootElement(); List inputItems = inputRoot.getChildren("item"); System.out.println("Setting up inputs in tmpdir: " + tmpdir); // make, save shuffled doc Document shuffledDoc = new Document(); Element shuffledRoot = new Element("regression"); shuffledDoc.setRootElement(shuffledRoot); Random rand = new Random(); while (inputItems.size() > 0) { Element rItem = (Element) inputItems.remove(rand.nextInt(inputItems.size())); shuffledRoot.addContent(rItem); } FileOutputStream shuffledOut = new FileOutputStream(new File(tmpDir, "shuffled.xml")); tester.grammar.serializeXml(shuffledDoc, shuffledOut); shuffledOut.close(); List shuffledItems = shuffledRoot.getChildren("item"); int numItems = shuffledItems.size(); Element[] shuffledItemsArray = new Element[numItems]; shuffledItems.toArray(shuffledItemsArray); // need a non-live listing // get LF listing Element[] shuffledLFsArray = new Element[numItems]; for (int i = 0; i < numItems; i++) { Element item = shuffledItemsArray[i]; shuffledLFsArray[i] = item.getChild("lf"); // reduce content to just full-words (if present) Element fullWords = item.getChild("full-words"); item.setContent((List)null); if (fullWords != null) item.addContent(fullWords); } // make folds docs, leaving LFs out of training, and // removing any exact duplicates with test items int itemsPerFold = (int) Math.floor(numItems / (numFolds * 1.0)); Set testStrings = new HashSet(); int dups = 0; for (int i = 0; i < numFolds; i++) { testStrings.clear(); dups = 0; int foldStart = i * itemsPerFold; int foldLimit = (i < numFolds - 1) ? 
foldStart + itemsPerFold : numItems; Document testDoc = new Document(); Element testRoot = new Element("regression"); testDoc.setRootElement(testRoot); Document trainDoc = new Document(); Element trainRoot = new Element("regression"); trainDoc.setRootElement(trainRoot); // split items into train/test for (int j = 0; j < numItems; j++) { Element item = shuffledItemsArray[j]; item.detach(); Element lf = shuffledLFsArray[j]; if (foldStart <= j && j < foldLimit) { testRoot.addContent(item); item.addContent(lf); testStrings.add(item.getAttributeValue("string")); } else { // special case for 1.x folds: limit training data // to first numItems - itemsPerFold items if (numFolds < 2 && i == 1 && j >= (numItems - itemsPerFold)) continue; trainRoot.addContent(item); } } // check for dups in training items List trainingItems = trainRoot.getChildren("item"); for (Iterator it = trainingItems.iterator(); it.hasNext(); ) { Element item = (Element) it.next(); if (testStrings.contains(item.getAttributeValue("string"))) { it.remove(); dups++; } } if (dups > 0) { System.out.println("Removing " + dups + " test item duplicate(s) from training, fold " + i); } FileOutputStream testOut = new FileOutputStream(new File(tmpDir, testFileName(i))); tester.grammar.serializeXml(testDoc, testOut); testOut.close(); FileOutputStream trainOut = new FileOutputStream(new File(tmpDir, trainingFileName(i))); tester.grammar.serializeXml(trainDoc, trainOut); trainOut.close(); } System.out.println(); } catch (JDOMException exc) { throw (IOException) new IOException().initCause(exc); } } // training/test file names private String trainingFileName(int foldNum) { return "fold" + foldNum + "-train.xml"; } private String testFileName(int foldNum) { return "fold" + foldNum + "-test.xml"; } /** Does scorer prep (if any) on the folds already set-up in tmpdir. */ public void prepScorers() throws IOException { // ensure tmpDir set if (tmpDir == null) tmpDir = new File(tmpdir); System.out.println("Preparing scorers in tmpdir: " + tmpdir); System.out.println(); // do each fold for (int i = 0; i < numFolds; i++) { // make training/test files for fold File trainFile = new File(tmpDir, trainingFileName(i)); File testFile = new File(tmpDir, testFileName(i)); // prep scorer scorerMaker.prepScorer(tmpDir, i, trainFile, testFile); } // summary scorerMaker.prepScorersSummary(tmpDir); } /** Default, do-nothing implementation of ScorerMaker.setCVR. */ public void setCVR(CrossValidateRealizer cvr) {} /** Default, do-nothing implementation of ScorerMaker.prepScorer. */ public void prepScorer(File tmpDir, int foldNum, File trainFile, File testFile) throws IOException {} /** Default, do-nothing implementation of ScorerMaker.prepScorersSummary. */ public void prepScorersSummary(File tmpDir) throws IOException {} /** * Default implementation of ScorerMaker.loadScorer. * Loads an n-gram precision model with semantic class replacement, * using targets from the training data. */ public SignScorer loadScorer(File tmpDir, int foldNum, File trainFile) throws IOException { RegressionInfo trainingItems = new RegressionInfo(tester.grammar, trainFile); String[] targets = new String[trainingItems.numberOfItems()]; for (int i=0; i < trainingItems.numberOfItems(); i++) { targets[i] = trainingItems.getItem(i).sentence; } NgramPrecisionModel retval = (tester.ngramOrder > 0) ? new NgramPrecisionModel(targets, tester.ngramOrder, true) : new NgramPrecisionModel(targets, true); return retval; } /** Run the cross-validation test on the folds already set-up in tmpdir. 
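* The same setup/prep/test cycle is normally driven from the command line via the
* main routine below, e.g. (illustrative invocation; the grammar, testbed and tmp
* directory names are placeholders, and the OpenCCG jars are assumed to be on the
* classpath):
* <pre>
* java opennlp.ccg.test.CrossValidateRealizer -folds 10 -tmp tmp -g grammar.xml testbed.xml
* </pre>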
*/ public void runTest() throws IOException { // ensure tmpDir set if (tmpDir == null) tmpDir = new File(tmpdir); // turn-off parsing, stats tester.doParsing = false; tester.showStats = false; // setup realizer tester.realizer = new Realizer(tester.grammar); if (pruningStrategy != null) { tester.realizer.pruningStrategy = pruningStrategy; } // show realizer settings Regression.showRealizerSettings(); // do each fold for (int i = 0; i < numFolds; i++) { // make files for fold File trainFile = new File(tmpDir, trainingFileName(i)); File testFile = new File(tmpDir, testFileName(i)); // load scorer tester.scorer = scorerMaker.loadScorer(tmpDir, i, trainFile); // run test tester.runTest(testFile); } // show stats tester.showStats(); } /** Command-line routine for cross-validating realizer. */ public static void main(String[] args) throws IOException { String usage = "java opennlp.ccg.test.CrossValidateRealizer " + "(-folds N) (-tmp ) " + "(-setuponly) (-skipsetup) " + "(-preponly) (-skipprep) " + "(-ngramorder N) " + "(-scorermaker ) " + "(-pruningstrategy ) " + "(-g ) (-s ) ()"; if (args.length > 0 && args[0].equals("-h")) { System.out.println("Usage: " + usage); System.exit(0); } // args double numFolds = 0; String tmpdir = null; boolean setupOnly = false; boolean skipSetup = false; boolean prepOnly = false; boolean skipPrep = false; int ngramOrder = 0; String scorerMakerClass = null; String pruningStrategyClass = null; String grammarfile = "grammar.xml"; String testbedfile = "testbed.xml"; String statsfile = null; for (int i = 0; i < args.length; i++) { if (args[i].equals("-folds")) { numFolds = Double.parseDouble(args[++i]); if (numFolds < 1 || (numFolds >= 2 && numFolds != Math.round(numFolds))) { System.out.println("Error, folds must be 1.x or an int of at least 2"); System.exit(-1); } continue; } if (args[i].equals("-tmp")) { tmpdir = args[++i]; continue; } if (args[i].equals("-setuponly")) { setupOnly = true; continue; } if (args[i].equals("-skipsetup")) { skipSetup = true; continue; } if (args[i].equals("-preponly")) { prepOnly = true; continue; } if (args[i].equals("-skipprep")) { skipPrep = true; continue; } if (args[i].equals("-ngramorder")) { ngramOrder = Integer.parseInt(args[++i]); continue; } if (args[i].equals("-scorermaker")) { scorerMakerClass = args[++i]; continue; } if (args[i].equals("-pruningstrategy")) { pruningStrategyClass = args[++i]; continue; } if (args[i].equals("-g")) { grammarfile = args[++i]; continue; } if (args[i].equals("-s")) { statsfile = args[++i]; continue; } testbedfile = args[i]; } // make cross-validator URL grammarURL = new File(grammarfile).toURI().toURL(); CrossValidateRealizer cvr = new CrossValidateRealizer(grammarURL); if (numFolds > 0) cvr.numFolds = numFolds; if (tmpdir != null) cvr.tmpdir = tmpdir; if (ngramOrder > 0) cvr.tester.ngramOrder = ngramOrder; if (scorerMakerClass != null) { try { cvr.scorerMaker = (ScorerMaker) Class.forName(scorerMakerClass).newInstance(); cvr.scorerMaker.setCVR(cvr); } catch (Exception exc) { throw (RuntimeException) new RuntimeException().initCause(exc); } } if (pruningStrategyClass != null) { try { cvr.pruningStrategy = (PruningStrategy) Class.forName(pruningStrategyClass).newInstance(); } catch (Exception exc) { throw (RuntimeException) new RuntimeException().initCause(exc); } } if (statsfile != null) cvr.tester.statsfile = statsfile; // set-up inputs URL testbedURL = new File(testbedfile).toURI().toURL(); if (!skipSetup) { cvr.setupInputs(testbedURL); } if (setupOnly) { System.exit(0); } // prep scorers if 
(!skipPrep) { cvr.prepScorers(); } if (prepOnly) { System.exit(0); } // run test System.gc(); cvr.runTest(); } } ================================================ FILE: src/opennlp/ccg/test/DerivMaker.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2016 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.test; //import java.util.*; import org.jdom.*; import opennlp.ccg.synsem.*; /** * Utility class for exporting derivations in xml. * * @author Michael White * @version $Revision: 1.5 $, $Date: 2009/12/21 04:18:31 $ */ public class DerivMaker { /** * Returns a derivation in the same format as the converted CCGbank, * but just with the lexemes, POS tags and supertags. */ public static Element makeDeriv(Sign sign) { Element retval; if (sign.isLexical()) { retval = new Element("Leafnode"); retval.setAttribute("lexeme",sign.getOrthography()); retval.setAttribute("pos",sign.getPOS()); } else { retval = new Element("Treenode"); for (Sign child: sign.getDerivationHistory().getInputs()) retval.addContent(makeDeriv(child)); } retval.setAttribute("stag",sign.getSupertag()); return retval; } } ================================================ FILE: src/opennlp/ccg/test/GenTargets.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.test; import opennlp.ccg.realize.*; import opennlp.ccg.grammar.*; import opennlp.ccg.synsem.*; import opennlp.ccg.ngrams.*; import org.jdom.*; import java.io.*; import java.net.*; import java.util.*; /** * Generates initial target sentences from a list of logical forms. * The input is an XML file with a list of top-level LF elements. 
* The output is a testbed file, with the number of parses just * set to 1 (rather than actually being computed). * The best realization is determined using n-grams from an * existing testbed file. * * @author Michael White * @version $Revision: 1.9 $, $Date: 2009/12/21 04:18:31 $ */ public class GenTargets { /** The grammar. */ private Grammar grammar; /** The realizer instance. */ private Realizer realizer; /** The n-gram scorer. */ private NgramScorer ngramScorer; /** The unique target strings. */ private Set uniqueTargets = new HashSet(); /** * Constructor: loads grammar, instantiates realizer, and sets up n-gram scorer * using targets with sem class replacement from the testbed. */ private GenTargets(URL grammarURL, File regressionFile) throws IOException { // load grammar System.out.println("Loading grammar from: " + grammarURL); grammar = new Grammar(grammarURL); // set up n-gram scorer System.out.println("Loading target phrases from: " + regressionFile); RegressionInfo rinfo = new RegressionInfo(grammar, regressionFile); String[] targets = new String[rinfo.numberOfItems()]; for (int i=0; i < targets.length; i++) { String target = rinfo.getItem(i).sentence; targets[i] = target; } // use targets with sem class replacement ngramScorer = new NgramPrecisionModel(targets, true); // instantiate realizer realizer = new Realizer(grammar); } // does realization, adds test case private void realize(Element lfElt, Element outRoot) throws IOException { // get LF LF lf = Realizer.getLfFromElt(lfElt); // run request realizer.realize(lf, ngramScorer); Chart chart = realizer.getChart(); // make test item (w/o trying to figure out the correct number of parses) String target = chart.bestEdge.getSign().getOrthography(); if (uniqueTargets.contains(target)) { System.out.println("Duplicate realization: " + target); return; } uniqueTargets.add(target); System.out.println("Best realization: " + target); Element testElt = RegressionInfo.makeTestItem(grammar, target, 1, lf); // add to output outRoot.addContent(testElt); if (!chart.bestEdge.complete()) { System.out.println("NB: realization incomplete!"); testElt.setAttribute("complete", "false"); } } /** Creates generator and runs it on the given input file. 
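* An illustrative invocation (the input and output file names are placeholders;
* -g and -tb default to grammar.xml and testbed.xml, and the OpenCCG jars are
* assumed to be on the classpath):
* <pre>
* java opennlp.ccg.test.GenTargets -g grammar.xml -tb testbed.xml lfs.xml targets.xml
* </pre>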
*/ @SuppressWarnings("unchecked") public static void main(String[] args) throws IOException { String usage = "Usage: java opennlp.ccg.test.GenTargets (-g ) (-tb ) "; if (args.length > 0 && args[0].equals("-h")) { System.out.println(usage); System.exit(0); } // args String grammarfile = "grammar.xml"; String testbedfile = "testbed.xml"; String inputfile = null; String outputfile = null; for (int i = 0; i < args.length; i++) { if (args[i].equals("-g")) { grammarfile = args[++i]; continue; } if (args[i].equals("-tb")) { testbedfile = args[++i]; continue; } if (inputfile == null) { inputfile = args[i]; continue; } if (outputfile == null) { outputfile = args[i]; continue; } } if (inputfile == null || outputfile == null) { System.out.println(usage); System.exit(0); } // create Generator File gFile = new File(grammarfile); URL grammarURL = gFile.toURI().toURL(); File tbFile = new File(testbedfile); if (!tbFile.exists()) { tbFile = new File(gFile.getParentFile(), testbedfile); } GenTargets gen = new GenTargets(grammarURL, tbFile); // load input LFs System.out.println("Loading LFs from: " + inputfile); Document doc = gen.grammar.loadFromXml(inputfile); // create output doc Document outDoc = new Document(); Element outRoot = new Element("regression"); outDoc.setRootElement(outRoot); // realize each one System.out.println("Realizing LFs ..."); Element root = doc.getRootElement(); List lfElts = root.getChildren("lf"); for (int i = 0; i < lfElts.size(); i++) { Element lfElt = (Element) lfElts.get(i); try { gen.realize(lfElt, outRoot); } catch (Exception exc) { System.out.println("Warning: unable to realize LF " + i + ": " + exc); } } // save file System.out.println("Saving results to: " + outputfile); FileOutputStream out = new FileOutputStream(outputfile); gen.grammar.serializeXml(outDoc, out); out.close(); System.out.println("Done."); } } ================================================ FILE: src/opennlp/ccg/test/Regression.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-9 Jason Baldridge and Michael White (University of Edinburgh / The Ohio State University) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.test; import java.io.*; import java.net.URL; import java.text.*; import java.util.*; import java.util.prefs.Preferences; import opennlp.ccg.TextCCG; import opennlp.ccg.grammar.Grammar; import opennlp.ccg.hylo.*; import opennlp.ccg.lexicon.Tokenizer; import opennlp.ccg.lexicon.Word; import opennlp.ccg.ngrams.*; import opennlp.ccg.parse.ParseException; import opennlp.ccg.parse.Parser; import opennlp.ccg.parse.Supertagger; import opennlp.ccg.parse.supertagger.WordAndPOSDictionaryLabellingStrategy; import opennlp.ccg.realize.*; import opennlp.ccg.realize.hypertagger.ZLMaxentHypertagger; import opennlp.ccg.synsem.*; import opennlp.ccg.util.Pair; import opennlp.ccg.util.SingletonList; import opennlp.ccg.perceptron.*; import org.jdom.*; import org.jdom.output.Format; import org.jdom.output.XMLOutputter; /** * Automates the testing of CCG grammars. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.151 $, $Date: 2011/12/11 16:51:58 $ */ public class Regression { /** Flag for whether to do parsing. */ public boolean doParsing = true; /** Flag for whether to do realization. */ public boolean doRealization = true; /** Flag for whether to just do even items. */ public boolean evenOnly = false; /** Flag for whether to just do odd items. */ public boolean oddOnly = false; /** Flag for whether to do garbage collection before each iteration. */ public boolean doGC = false; /** File to write events to (if any). */ public String eventfile = null; /** Flag for whether to include the gold sign when generating events. */ public boolean includeGoldInEvents = false; /** Directory for writing APML files (if any). */ public String apmldir = null; /** Flag for whether to show realization stats. */ public boolean showStats = true; /** Flag for whether to show parsing stats. */ public boolean showParseStats = false; /** File to dump realizer stats to (if any). */ public String statsfile = null; /** File prefix to write bleu test files to (if any). */ public String bleufileprefix = null; /** File to write n-best realizations to (if any). */ public String nbestrealfile = null; /** Flag for whether to normalize strings as for BLEU scoring in n-best output. */ public boolean nbestnormbleu = false; /** Directory to save best realization serializations to (if any). */ public String realserdir = null; /** File to write rescored sign scores to (if any). */ public String rescorefile = null; /** Map from info keys to best realization signs for serialization (if any). */ public Map bestRealMap = null; /** Flag for whether to include LFs in n-best output. */ public boolean nbestincludelfs = false; /** File to write n-best parses to (if any). */ public String nbestparsefile = null; /** The grammar to use for testing. */ public Grammar grammar = null; /** The parser to use for testing. */ public Parser parser = null; /** The realizer to use for testing. */ public Realizer realizer = null; /** The scorer to use for realizer testing (or null, for default). */ public SignScorer scorer = null; /** The scorer to use for parser testing. */ public SignScorer parseScorer = null; /** Flag for whether to only allow exact matches with the default scorer. */ public boolean exactMatches = false; /** The n-gram order to use with the default scorer (or 0, for default). */ public int ngramOrder = 0; /** The feature extractor to use in extracting events. 
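* For event extraction this is typically paired with an event file, e.g.
* (sketch; the output path is a placeholder, and the grammar, parser and
* realizer fields above must still be set before calling runTest):
* <pre>
* Regression tester = new Regression();
* tester.eventfile = "events.txt";
* tester.featureExtractor = new SyntacticFeatureExtractor();
* </pre>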
*/ public FeatureExtractor featureExtractor = null; // // the various totals // public int pCount = 0; public int pBadCount = 0; public int pFailedCount = 0; public int pExactCount = 0; public double totalF = 0.0; public double totalRecall = 0.0; public double totalPrecision = 0.0; public double totalDepsF = 0.0; public double totalDepsRecall = 0.0; public double totalDepsPrecision = 0.0; public double totalUnlabeledDepsF = 0.0; public double totalUnlabeledDepsRecall = 0.0; public double totalUnlabeledDepsPrecision = 0.0; public double totalFComplete = 0.0; public double totalRecallComplete = 0.0; public double totalPrecisionComplete = 0.0; public double totalDepsFComplete = 0.0; public double totalDepsRecallComplete = 0.0; public double totalDepsPrecisionComplete = 0.0; public double totalUnlabeledDepsFComplete = 0.0; public double totalUnlabeledDepsRecallComplete = 0.0; public double totalUnlabeledDepsPrecisionComplete = 0.0; public int pTotalEdges = 0; public int pTotalEdgesGood = 0; public int pMaxEdges = 0; public int pMaxEdgesGood = 0; public int pTotalUnpackingEdges = 0; public int pMaxUnpackingEdges = 0; public int pTotalCellMax = 0; public int pTotalCellMaxGood = 0; public int pMaxCellMax = 0; public int pMaxCellMaxGood = 0; public int pTotalLexTime = 0; public int pTotalParseTime = 0; public int pTotalChartTime = 0; public int pTotalUnpackingTime = 0; public int pMaxLexTime = 0; public int pMaxParseTime = 0; public int pMaxChartTime = 0; public int pMaxUnpackingTime = 0; public Map pBetaTallies = null; public int rCount = 0; public int rDoneCount = 0; public int rBadCount = 0; public int rExactCount = 0; public double totalScore = 0.0; public double totalScoreComplete = 0.0; public double totalReciprocalRank = 0.0; public int totalNominals = 0; public int totalTokens = 0; public int minTokens = 0; public int maxTokens = 0; public int totalRuleApps = 0; public int totalEdges = 0; public int totalEdgesCreated = 0; public int totalUnprunedEdges = 0; public int totalPrunedRemoved = 0; public int totalPrunedNeverAdded = 0; public int totalCellMax = 0; public int totalNewBest = 0; public int totalLex = 0; public int totalFirst = 0; public int totalBest = 0; public int totalPacked = 0; public int totalStoppedOrDone = 0; public int maxLex = 0; public int maxFirst = 0; public int maxBest = 0; public int maxNewBest = 0; public int maxPacked = 0; public int maxStoppedOrDone = 0; public int oracleBetter = 0; public int goldMissing = 0; public String maxLexStr = null; public String maxFirstStr = null; public String maxBestStr = null; public String maxNewBestStr = null; public String maxPackedStr = null; public String maxStoppedOrDoneStr = null; public List bestEstimatedScores = null; public List bestActualScores = null; public List itemRanks = null; public TimingMap lexMap = null; public TimingMap firstMap = null; public TimingMap bestMap = null; public TimingMap allMap = null; private PrintWriter events = null; private PrintWriter bleuGen = null; private PrintWriter bleuRef = null; private PrintWriter bleuSrc = null; private PrintWriter nbestrealPW = null; private PrintWriter rescorePW = null; private PrintWriter nbestparsePW = null; private XMLOutputter xmlOutputter = new XMLOutputter(); // for xml-escaping strings /** Constructor. */ public Regression() { // init resetTotals(); } /** Resets the various totals. 
*/ public void resetTotals() { // parser pCount = 0; pBadCount = 0; pFailedCount = 0; pExactCount = 0; totalF = 0.0; totalRecall = 0.0; totalPrecision = 0.0; totalDepsF = 0.0; totalDepsRecall = 0.0; totalDepsPrecision = 0.0; totalUnlabeledDepsF = 0.0; totalUnlabeledDepsRecall = 0.0; totalUnlabeledDepsPrecision = 0.0; totalFComplete = 0.0; totalRecallComplete = 0.0; totalPrecisionComplete = 0.0; totalDepsFComplete = 0.0; totalDepsRecallComplete = 0.0; totalDepsPrecisionComplete = 0.0; totalUnlabeledDepsFComplete = 0.0; totalUnlabeledDepsRecallComplete = 0.0; totalUnlabeledDepsPrecisionComplete = 0.0; pTotalEdges = 0; pTotalEdgesGood = 0; pMaxEdges = 0; pMaxEdgesGood = 0; pTotalUnpackingEdges = 0; pMaxUnpackingEdges = 0; pTotalCellMax = 0; pTotalCellMaxGood = 0; pMaxCellMax = 0; pMaxCellMaxGood = 0; pTotalLexTime = 0; pTotalParseTime = 0; pTotalChartTime = 0; pTotalUnpackingTime = 0; pMaxLexTime = 0; pMaxParseTime = 0; pMaxChartTime = 0; pMaxUnpackingTime = 0; if (doParsing) { pBetaTallies = new TreeMap(); } // realizer rCount = 0; rDoneCount = 0; rBadCount = 0; rExactCount = 0; totalScore = 0.0; totalScoreComplete = 0.0; totalReciprocalRank = 0.0; totalNominals = 0; totalTokens = 0; minTokens = 0; maxTokens = 0; totalRuleApps = 0; totalEdges = 0; totalEdgesCreated = 0; totalUnprunedEdges = 0; totalPrunedRemoved = 0; totalPrunedNeverAdded = 0; totalCellMax = 0; totalNewBest = 0; totalLex = 0; totalFirst = 0; totalBest = 0; totalPacked = 0; totalStoppedOrDone = 0; maxLex = 0; maxFirst = 0; maxBest = 0; maxNewBest = 0; maxPacked = 0; maxStoppedOrDone = 0; oracleBetter = 0; goldMissing = 0; maxLexStr = null; maxFirstStr = null; maxBestStr = null; maxNewBestStr = null; maxPackedStr = null; maxStoppedOrDoneStr = null; if (doRealization) { bestActualScores = new ArrayList(); bestEstimatedScores = new ArrayList(); itemRanks = new ArrayList(); lexMap = new TimingMap("lex"); firstMap = new TimingMap("first"); bestMap = new TimingMap("best"); allMap = new TimingMap("all"); } } // sets up bleu output private void bleuSetup() throws IOException { // setup bleu files, if apropos if (bleufileprefix != null && doRealization) { bleuGen = new PrintWriter(new BufferedWriter(new FileWriter(bleufileprefix + "-gen.sgm"))); bleuRef = new PrintWriter(new BufferedWriter(new FileWriter(bleufileprefix + "-ref.sgm"))); bleuSrc = new PrintWriter(new BufferedWriter(new FileWriter(bleufileprefix + "-src.sgm"))); bleuGen.println(""); bleuRef.println(""); bleuSrc.println(""); } } // sets up n-best realization output private void nbestrealSetup() throws IOException { // set up file to write ref & n-best realizations (if any) if (nbestrealfile != null && doRealization) { nbestrealPW = new PrintWriter(new BufferedWriter(new FileWriter(nbestrealfile))); nbestrealPW.println(""); } } // sets up rescored sign score output private void rescoreSetup() throws IOException { // set up rescoring file if (rescorefile != null) { rescorePW = new PrintWriter(new BufferedWriter(new FileWriter(rescorefile))); rescorePW.println(""); } } // sets up n-best parsing output private void nbestparseSetup() throws IOException { // set up file to write sentence & n-best parses (if any) if (nbestparsefile != null && doParsing) { nbestparsePW = new PrintWriter(new BufferedWriter(new FileWriter(nbestparsefile))); nbestparsePW.println(""); } } // starts a doc private void bleuStartDoc(String id) { if (bleufileprefix != null && doRealization) { bleuGen.println(""); bleuRef.println(""); bleuSrc.println(""); } } // ends a doc private void bleuEndDoc() { if 
(bleufileprefix != null && doRealization) { bleuGen.println(""); bleuRef.println(""); bleuSrc.println(""); } } // finishes bleu output private void bleuFinish() throws IOException { // finish bleu files, if apropos if (bleufileprefix != null && doRealization) { bleuGen.println(""); bleuRef.println(""); bleuSrc.println(""); bleuGen.flush(); bleuGen.close(); bleuRef.flush(); bleuRef.close(); bleuSrc.flush(); bleuSrc.close(); } } // finishes n-best realization output private void nbestrealFinish() throws IOException { // finish n-best real file, if apropos if (nbestrealfile != null && doRealization) { nbestrealPW.println(""); nbestrealPW.flush(); nbestrealPW.close(); } } // finishes rescored sign output private void rescoreFinish() throws IOException { // finish rescoring file if (rescorefile != null) { rescorePW.println(""); rescorePW.flush(); rescorePW.close(); } } // finishes n-best parsing output private void nbestparseFinish() throws IOException { // finish n-best real file, if apropos if (nbestparsefile != null && doParsing) { nbestparsePW.println(""); nbestparsePW.flush(); nbestparsePW.close(); } } // resets bestRealMap private void realserStartDoc() { if (realserdir != null && doRealization) { bestRealMap = new HashMap(); } } // serializes bestRealMap private void realserEndDoc(String testName) throws IOException { if (realserdir != null && doRealization) { File serFile = new File(new File(realserdir), testName + ".ser"); ObjectOutputStream oos = new ObjectOutputStream(new FileOutputStream(serFile)); oos.writeObject(bestRealMap); oos.close(); } } // escapes string for xml output private String xmlEscape(String s) { return xmlOutputter.outputString(new Text(s)); } // normalizes realizations for BLEU scoring // at present, this means replacing underscores with spaces and escaping for xml output private String norm_bleu(String s) { return xmlEscape(s.replace('_', ' ')); } /** Runs the test on the items in the given file or directory of files. */ public void runTest(File regressionFile) throws IOException { // set up event file (if any) if (eventfile != null) events = EventFile.openWriter(new File(eventfile)); // set up bleu output, n-best realizations, rescoring, n-best parses (if apropos) bleuSetup(); nbestrealSetup(); rescoreSetup(); nbestparseSetup(); // do each file or files for (File f : getXMLFiles(regressionFile)) runSingleTest(f); // finish bleu, n-best realization output, rescoring, n-best parses (if apropos) bleuFinish(); nbestrealFinish(); rescoreFinish(); nbestparseFinish(); // close event file (if any) if (events != null) { events.flush(); events.close(); } // show stats (if apropos) if (rescorefile != null) return; if (doParsing && showParseStats) showParseStats(); if (doRealization && showStats) showStats(); } /** Returns a list of xml files from the given file or directory. */ public static List getXMLFiles(File file) { if (!file.isDirectory()) return new SingletonList(file); List retval = new ArrayList(); File[] files = file.listFiles(); Arrays.sort(files); for (int i = 0; i < files.length; i++) { if (!files[i].isDirectory() && files[i].getName().endsWith(".xml")) retval.add(files[i]); } return retval; } /** Runs the test on the items in the given file. 
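With the -even option, items at odd (0-based) positions are skipped; with -odd, items at even positions are skipped.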
*/ private void runSingleTest(File regressionFile) throws IOException { String testName = regressionFile.getName(); int lastDot = testName.lastIndexOf('.'); if (lastDot > 0) testName = testName.substring(0, lastDot); // load testfile System.out.println("Loading: " + testName); System.out.println(); RegressionInfo rinfo = new RegressionInfo(grammar, regressionFile); // start bleu doc (if apropos) bleuStartDoc(testName); // start storing best realizations for serialization (if apropos) realserStartDoc(); // do each test int numItems = rinfo.numberOfItems(); System.out.println("Parse\tRealize\tString"); System.out.println("-----\t-------\t------"); for (int i=0; i < numItems; i++) { // check even/odd only if (i % 2 == 1 && evenOnly) continue; if (i % 2 == 0 && oddOnly) continue; RegressionInfo.TestItem testItem = rinfo.getItem(i); if (doGC) System.gc(); // short circuit for sign rescoring; realization only at the moment if (rescorefile != null) { String id = testItem.info; double score = scorer.score(testItem.sign, true); rescorePW.println(""); showOutcome("-", nfE.format(score), "", testItem.sign.getOrthography()); continue; } List parses = null; List parseScores = null; LF parsedLF = null; LF compactedLF = null; LF transformedParsedLF = null; boolean parsed = false; boolean parsedComplete = false; if (doParsing) { try { // use full-words or words from stored sign if possible List words = null; if (testItem.fullWords != null) { words = grammar.lexicon.tokenizer.tokenize(testItem.fullWords, true); // strip and if (words.get(0).getForm() == "") words.remove(0); if (words.get(words.size()-1).getForm() == "") words.remove(words.size()-1); } else if (testItem.sign != null) { words = testItem.sign.getWords(); } if (words != null) { // parse 'em parser.parse(words); } else { parser.parse(testItem.sentence); } // retrieve results parses = parser.getResult(); parseScores = parser.getScores(); parsed = true; parsedComplete = !parses.get(0).getCategory().isFragment(); // get LF of best parse, if needed if (showParseStats || (doRealization && testItem.lfElt == null && testItem.sign == null)) { Sign sign = parses.get(0); Category cat = sign.getCategory().copy(); Nominal index = cat.getIndexNominal(); parsedLF = cat.getLF(); index = HyloHelper.convertNominals(parsedLF, sign, index); compactedLF = HyloHelper.compact(parsedLF, index); // get transformed version if needed if (testItem.sign == null) { transformedParsedLF = grammar.transformLF(compactedLF); } } } catch (ParseException e) { parses = Collections.emptyList(); parsed = false; } catch (Exception e) { parses = Collections.emptyList(); parsed = false; System.err.println("Uncaught exception in parsing: " + testItem.sentence); e.printStackTrace(System.err); } // update parse stats int count = parser.edgeCount(); pTotalEdges += count; if (count > pMaxEdges) pMaxEdges = count; if (parsedComplete) { pTotalEdgesGood += count; if (count > pMaxEdgesGood) pMaxEdgesGood = count; } count = parser.unpackingEdgeCount(); pTotalUnpackingEdges += count; if (count > pMaxUnpackingEdges) pMaxUnpackingEdges = count; int cellMax = parser.maxCellSize(); pTotalCellMax += cellMax; if (cellMax > pMaxCellMax) pMaxCellMax = cellMax; if (parsedComplete) { pTotalCellMaxGood += cellMax; if (cellMax > pMaxCellMaxGood) pMaxCellMaxGood = cellMax; } int time = parser.getLexTime(); pTotalLexTime += time; if (time > pMaxLexTime) pMaxLexTime = time; time = parser.getParseTime(); pTotalParseTime += time; if (time > pMaxParseTime) pMaxParseTime = time; time = parser.getChartTime(); 
pTotalChartTime += time; if (time > pMaxChartTime) pMaxChartTime = time; time = parser.getUnpackingTime(); pTotalUnpackingTime += time; if (time > pMaxUnpackingTime) pMaxUnpackingTime = time; double beta = parser.getSupertaggerBeta(); Integer betaTally = pBetaTallies.get(beta); pBetaTallies.put(beta, (betaTally != null) ? ++betaTally : 1); } // get test item LF, if needed LF testItemLF = null; if (testItem.lfElt != null && (doRealization || (showParseStats && parsed && testItem.sign == null))) { Element lfElt = testItem.lfElt; Document doc = new Document(); lfElt.detach(); doc.setRootElement(lfElt); testItemLF = grammar.loadLF(doc); } // compare EPs EPsScorer.Results parseScore = null; LF goldLF = null; if (showParseStats && parsedLF != null) { // get LF to score, gold LF LF lfToScore = null; if (testItem.sign != null) { // use LF from stored sign if available lfToScore = parsedLF; Category cat = testItem.sign.getCategory().copy(); Nominal index = cat.getIndexNominal(); goldLF = cat.getLF(); index = HyloHelper.convertNominals(goldLF, testItem.sign, index); } else { // otherwise use test item LF lfToScore = transformedParsedLF; goldLF = testItemLF; } if (goldLF == null) { throw new RuntimeException( "Can't score parse: " + testItem.sentence + "!\n" + "No gold LF." ); } // score parse parseScore = EPsScorer.score(lfToScore, goldLF); } // update parsing results if (showParseStats && testItem.numOfParses > 0) { pCount++; if (parses.size() == 0 || !parsedComplete) pBadCount++; if (parses.size() == 0) pFailedCount++; if (parseScore != null) { if (parseScore.fscore == 1.0) pExactCount++; totalF += parseScore.fscore; totalRecall += parseScore.recall; totalPrecision += parseScore.precision; totalDepsF += parseScore.depsFscore; totalDepsRecall += parseScore.depsRecall; totalDepsPrecision += parseScore.depsPrecision; totalUnlabeledDepsF += parseScore.unlabeledDepsFscore; totalUnlabeledDepsRecall += parseScore.unlabeledDepsRecall; totalUnlabeledDepsPrecision += parseScore.unlabeledDepsPrecision; if (parsedComplete) { totalFComplete += parseScore.fscore; totalRecallComplete += parseScore.recall; totalPrecisionComplete += parseScore.precision; totalDepsFComplete += parseScore.depsFscore; totalDepsRecallComplete += parseScore.depsRecall; totalDepsPrecisionComplete += parseScore.depsPrecision; totalUnlabeledDepsFComplete += parseScore.unlabeledDepsFscore; totalUnlabeledDepsRecallComplete += parseScore.unlabeledDepsRecall; totalUnlabeledDepsPrecisionComplete += parseScore.unlabeledDepsPrecision; } } } // events output if (events != null && doParsing) { // nb: only dealing with complete parses at the moment // nb: gold LF must come from saved sign if (parses.size() > 0 && testItem.sign != null) { List bestSigns = new ArrayList(parses); Sign best = parses.get(0); // update best if not exact match if (parseScore.fscore != 1.0) { // check oracle best Pair bestPair = parser.oracleBest(goldLF); if (bestPair.a != null) oracleBetter++; if (bestPair.b) { best = bestPair.a; if (!bestSigns.contains(best)) bestSigns.add(best); } // add gold if missing, if apropos else { goldMissing++; if (includeGoldInEvents) { best = testItem.sign; //parser.addSupertaggerLogProbs(best); bestSigns.add(best); } } } EventFile.writeEvents(events, bestSigns, best, featureExtractor); } } // n-best parses output if (nbestparsePW != null) { XMLOutputter outputter = new XMLOutputter(); outputter.setFormat(Format.getPrettyFormat()); // header for item String extras = ""; if (parsedComplete) extras += " complete=\"true\""; String id = 
testItem.info; if (id == null) id = "" + i; nbestparsePW.println(""); String tagend = (nbestincludelfs) ? ">" : "/>"; // add best parse if (parseScore != null) { double edgeScore = parseScores.get(0); String scores = "score=\"" + nf.format(parseScore.fscore) + "\" edge-score=\"" + nfE.format(edgeScore) + "\""; nbestparsePW.println(""); } } // add remaining n-best for (int k=1; k < parses.size(); k++) { Sign sign = parses.get(k); double edgeScore = parseScores.get(k); Category cat = sign.getCategory().copy(); Nominal index = cat.getIndexNominal(); LF parsedLFk = cat.getLF(); index = HyloHelper.convertNominals(parsedLFk, sign, index); LF compactedLFk = HyloHelper.compact(parsedLFk, index); LF lfToScore = parsedLFk; if (testItem.sign != null) { lfToScore = grammar.transformLF(compactedLFk); } EPsScorer.Results parseScoreK = EPsScorer.score(lfToScore, goldLF); String scores = "score=\"" + nf.format(parseScoreK.fscore) + "\" edge-score=\"" + nfE.format(edgeScore) + "\""; nbestparsePW.println(""); } } // close item nbestparsePW.println(""); } // determine string to show for parse result String starForBadSentence = ""; if (testItem.numOfParses == 0) starForBadSentence = "*"; String parseResult; if (!doParsing) { parseResult = "-"; } else if (parseScore != null) { parseResult = nf.format(parseScore.fscore); if (!parsedComplete) parseResult = "[" + parseResult + "]"; } else if (testItem.numOfParses == parses.size()) { parseResult = "ok"; } else if (testItem.numOfParses > 0 && parses.size() > 0) { // show num parses, if not the number expected parseResult = "(" + parses.size() + ")"; } else if (testItem.knownFailure) { parseResult = "(known)"; } else { parseResult = "FAILED"; } if (!doRealization || (doParsing && !parsed) || testItem.numOfParses == 0) { showOutcome(parseResult, "-", starForBadSentence, testItem.sentence); continue; } LF inputLF = null; // use given LF if (testItemLF != null) inputLF = testItemLF; // or LF from stored sign else if (testItem.sign != null) { Sign sign = testItem.sign; Category cat = sign.getCategory().copy(); Nominal index = cat.getIndexNominal(); LF convertedLF = HyloHelper.compactAndConvertNominals(cat.getLF(), index, sign); inputLF = grammar.transformLF(convertedLF); } // otherwise use first parse else if (transformedParsedLF != null) inputLF = transformedParsedLF; // otherwise give up else { String suggestion = (!doParsing) ? "Try leaving off -noparsing option." : ""; throw new RuntimeException("No LF to realize! " + suggestion); } // set up n-gram precision scorer for default scoring and/or scoring results String[] targets = (testItem.alt == null) ? 
new String[] { testItem.sentence } : new String[] { testItem.sentence, testItem.alt }; NgramPrecisionModel defaultNgramScorer = new NgramPrecisionModel(targets); SignScorer scorerToUse = scorer; if (scorerToUse == null) { if (ngramOrder > 0 || exactMatches) { if (ngramOrder > 0) scorerToUse = new NgramPrecisionModel(targets, ngramOrder); else scorerToUse = new NgramPrecisionModel(targets); ((NgramPrecisionModel)scorerToUse).setExactMatches(exactMatches); } else scorerToUse = defaultNgramScorer; } // set targets for self-paraphrase biasing else if (scorerToUse instanceof SelfParaphraseBiaser) { ((SelfParaphraseBiaser)scorerToUse).setTargets(targets); } if (doGC) System.gc(); try { //Add gold std pred supertag mapping to the hypertagger class if (events != null && realizer.hypertagger != null && testItem.predInfo != null) { realizer.hypertagger.storeGoldStdPredInfo(testItem.predInfo); } realizer.realize(inputLF, scorerToUse); } catch (Throwable thrwbl) { System.out.println("Unable to process: " + testItem.sentence); thrwbl.printStackTrace(System.out); continue; } opennlp.ccg.realize.Chart chart = realizer.getChart(); String realizeResult = "ok"; boolean gramcomplete = true; boolean joined = false; Edge bestEdge = chart.bestEdge; if (!bestEdge.complete() || bestEdge.getSign().getCategory().isFragment()) { realizeResult = "[ok]"; gramcomplete = false; rBadCount++; if (chart.joinFragments) { bestEdge = chart.bestJoinedEdge; joined = true; } } String bestRealization = bestEdge.getSign().getOrthography(); double score = defaultNgramScorer.score(bestEdge.getSign(), false); // nb: use default n-gram precision score for reporting // events output if (events != null) { List bestEdges = chart.bestEdges(); // nb: only dealing with complete realizations at the moment if (bestEdges.size() > 0) { Pair bestPair = chart.oracleBest(testItem.sentence); Edge oracleBest = bestPair.a; if (oracleBest != null) { Sign best = oracleBest.getSign(); List bestSigns = new ArrayList(bestEdges.size()+1); for (Edge e : bestEdges) bestSigns.add(e.getSign()); if (bestEdge != oracleBest) oracleBetter++; if (!bestPair.b) { goldMissing++; if (includeGoldInEvents) { best = testItem.sign; } } if (!bestSigns.contains(best)) bestSigns.add(best); EventFile.writeEvents(events, bestSigns, best, featureExtractor); } } } // bleu output if (bleufileprefix != null) { String extras = " time=\""; if (chart.done) extras += chart.timeTilDone; else extras += chart.timeTilStopped; extras += "\""; extras += " score=\"" + nf.format(score) + "\""; if (gramcomplete) extras += " complete=\"true\""; if (joined) extras += " joined=\"true\""; String id = testItem.info; if (id == null) id = "" + i; bleuGen.println("" + norm_bleu(bestRealization) + ""); String sent = norm_bleu(testItem.sentence); bleuRef.println("" + sent + ""); bleuSrc.println("" + sent + ""); } // n-best realization output if (nbestrealPW != null) { XMLOutputter outputter = new XMLOutputter(); outputter.setFormat(Format.getPrettyFormat()); // header for item String extras = ""; if (gramcomplete) extras += " complete=\"true\""; if (joined) extras += " joined=\"true\""; String id = testItem.info; if (id == null) id = "" + i; nbestrealPW.println(""); // add ref sentence String ref = (nbestnormbleu) ? norm_bleu(testItem.sentence) : xmlEscape(testItem.sentence); nbestrealPW.println("" + ref + ""); // add best realization String scores = "score=\"" + nf.format(score) + "\" edge-score=\"" + nfE.format(bestEdge.score) + "\""; String best = (nbestnormbleu) ? 
norm_bleu(bestRealization) : xmlEscape(bestRealization); if (!nbestincludelfs) nbestrealPW.println("" + best + ""); else { nbestrealPW.println(""); nbestrealPW.println("" + best + ""); Sign sign = bestEdge.getSign(); Category cat = sign.getCategory().copy(); Nominal index = cat.getIndexNominal(); LF lf = cat.getLF(); index = HyloHelper.convertNominalsToVars(lf, index); index = HyloHelper.convertNominals(lf, sign, index); LF lfc = HyloHelper.compact(lf, index); Element lfElt = grammar.makeLfElt(lfc); nbestrealPW.println(outputter.outputString(lfElt)); nbestrealPW.println(""); } // if complete, add remaining n-best if (bestEdge.complete()) { List bestEdges = chart.bestEdges(); for (int j=1; j < bestEdges.size(); j++) { Edge e = bestEdges.get(j); String eSent = e.getSign().getOrthography(); double eScore = defaultNgramScorer.score(e.getSign(), false); // nb: use default n-gram precision score for reporting String eScores = " score=\"" + nf.format(eScore) + "\" edge-score=\"" + nfE.format(e.score) + "\""; // add next realization String next = (nbestnormbleu) ? norm_bleu(eSent) : xmlEscape(eSent); if (!nbestincludelfs) nbestrealPW.println("" + next + ""); else { nbestrealPW.println(""); nbestrealPW.println("" + next + ""); Sign sign = e.getSign(); Category cat = sign.getCategory().copy(); Nominal index = cat.getIndexNominal(); LF lf = cat.getLF(); index = HyloHelper.convertNominalsToVars(lf, index); index = HyloHelper.convertNominals(lf, sign, index); LF lfc = HyloHelper.compact(lf, index); Element lfElt = grammar.makeLfElt(lfc); nbestrealPW.println(outputter.outputString(lfElt)); nbestrealPW.println(""); } } } // close item nbestrealPW.println(""); } // if apmldir non-null, output APML as apmldir/ex(i+1).apml if (apmldir != null) { String apmlfn = apmldir + "/ex" + (i+1) + ".apml"; grammar.saveToApml(bestEdge.getSign(), apmlfn); } // store best realization, if apropos and grammatically complete, keyed by info string or item position if (realserdir != null && gramcomplete) { String id = testItem.info; if (id == null) id = "i" + i; bestRealMap.put(testItem.info, bestEdge.getSign()); } // compute stats, show outcome rCount++; totalScore += score; if (gramcomplete) totalScoreComplete += score; int itemRank = 1; Tokenizer tokenizer = grammar.lexicon.tokenizer; String itemOrth = tokenizer.getOrthography(tokenizer.tokenize(testItem.sentence)); if (!bestRealization.equals(itemOrth)) { itemRank = 0; List bestEdges = chart.bestEdges(); for (int j = 0; j < bestEdges.size(); j++) { Edge edge = bestEdges.get(j); String str = edge.getSign().getOrthography(); if (str.equals(itemOrth)) { itemRank = j+1; break; } } if (itemRank > 0) totalReciprocalRank += (1.0 / itemRank); if (gramcomplete) { realizeResult = nf.format(score); if (itemRank > 0 && itemRank < 10) realizeResult += " "; if (itemRank > 0 && itemRank < 100) realizeResult += "#" + itemRank; } else { realizeResult = "[" + nf.format(score) + "]"; if (joined) realizeResult += "j"; } showOutcome(parseResult, realizeResult, starForBadSentence, testItem.sentence, bestRealization); } else { rExactCount++; totalReciprocalRank += 1.0; showOutcome(parseResult, realizeResult, starForBadSentence, testItem.sentence); } totalNominals += chart.numNominals; int tokens = testItem.sentence.split("\\s+").length; totalTokens += tokens; if (tokens < minTokens || minTokens == 0) minTokens = tokens; if (tokens > maxTokens) maxTokens = tokens; totalRuleApps += chart.edgeFactory.ruleApps(); totalEdges += chart.numEdgesInChart(); totalEdgesCreated += chart.numEdges; 
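// remaining per-item chart stats: pruning counts, best scores and ranks, and lex/first/best/packed/stopped-or-done times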
totalUnprunedEdges += chart.numUnprunedEdges(); totalPrunedRemoved += chart.numPrunedRemoved; totalPrunedNeverAdded += chart.numPrunedNeverAdded; totalCellMax += chart.cellMax; totalNewBest += chart.newBest; bestActualScores.add(new Double(score)); bestEstimatedScores.add(new Double(bestEdge.score)); itemRanks.add(new Integer(itemRank)); totalLex += chart.timeTilLex; if (chart.timeTilLex > maxLex) { maxLex = chart.timeTilLex; maxLexStr = testItem.sentence; } lexMap.add(chart.numNominals, chart.timeTilLex); totalFirst += chart.timeTilFirst; if (chart.timeTilFirst > maxFirst) { maxFirst = chart.timeTilFirst; maxFirstStr = testItem.sentence; } firstMap.add(chart.numNominals, chart.timeTilFirst); totalBest += chart.timeTilBest; if (chart.timeTilBest > maxBest) { maxBest = chart.timeTilBest; maxBestStr = testItem.sentence; } bestMap.add(chart.numNominals, chart.timeTilBest); if (chart.newBest > 0 && (chart.timeTilBest - chart.timeTilFirst) >= maxNewBest) { maxNewBest = chart.timeTilBest - chart.timeTilFirst; maxNewBestStr = testItem.sentence; } totalPacked += chart.timeTilPacked; if (chart.timeTilPacked > maxPacked) { maxPacked = chart.timeTilPacked; maxPackedStr = testItem.sentence; } if (chart.done) { rDoneCount++; totalStoppedOrDone += chart.timeTilDone; if (chart.timeTilDone > maxStoppedOrDone) { maxStoppedOrDone = chart.timeTilDone; maxStoppedOrDoneStr = testItem.sentence; } allMap.add(chart.numNominals, chart.timeTilDone); } else { totalStoppedOrDone += chart.timeTilStopped; if (chart.timeTilStopped > maxStoppedOrDone) { maxStoppedOrDone = chart.timeTilStopped; maxStoppedOrDoneStr = testItem.sentence; } allMap.add(chart.numNominals, chart.timeTilStopped); } } // end bleu doc (if apropos) bleuEndDoc(); System.out.println(); // serialize best realizations (if apropos) realserEndDoc(testName); } /** Shows the various parsing totals. 
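Accuracy figures are per-item averages reported as percentages; edge counts and times are averaged per item, with separate figures for complete (non-fragmentary) parses.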
*/ public void showParseStats() { int pCompleteCount = pCount - pBadCount; int pFragCount = pBadCount - pFailedCount; String pComplete = "" + pCompleteCount; String pCompletePct = "" + nf.format(100.0 * pCompleteCount / pCount) + "%"; System.out.println("Strings parsed completely (in fragments, failed): " + pComplete + " (" + pFragCount + ", " + pFailedCount + ") " + pCompletePct); String pInexact = "" + (pCount - pExactCount); String pExactPct = "" + nf.format(100.0 * pExactCount / pCount) + "%"; System.out.println("Strings parsed exactly (inexactly): " + pExactCount + " (" + pInexact + ") " + pExactPct); String avgEdges = nf.format(1.0 * pTotalEdges / pCount); System.out.println("Average edge count (before unpacking): " + avgEdges); String avgEdgesGood = nf.format(1.0 * pTotalEdgesGood / pCompleteCount); System.out.println("Average edge count (before unpacking) for complete parses: " + avgEdgesGood); System.out.println("Max edge count: " + pMaxEdges); System.out.println("Max edge count for complete parses: " + pMaxEdgesGood); String avgUnpacked = nf.format(1.0 * pTotalUnpackingEdges / pCount); System.out.println("Average edges unpacked (created while unpacking): " + avgUnpacked); System.out.println("Max unpacked edges: " + pMaxUnpackingEdges); String avgLexTime = nf.format(1.0 * pTotalLexTime / pCount); String avgCellMax = nf.format(1.0 * pTotalCellMax / pCount); System.out.println("Average max cell size (before unpacking): " + avgCellMax); String avgCellMaxGood = nf.format(1.0 * pTotalCellMaxGood / pCompleteCount); System.out.println("Average max cell size (before unpacking) for complete parses: " + avgCellMaxGood); System.out.println("Max max cell size: " + pMaxCellMax); System.out.println("Max max cell size for complete parses: " + pMaxCellMaxGood); System.out.println("Average lex lookup time: " + avgLexTime); String avgParseTime = nf.format(1.0 * pTotalParseTime / pCount); System.out.println("Max lex lookup time: " + pMaxLexTime); System.out.println("Average parse time: " + avgParseTime); System.out.println("Max parse time: " + pMaxParseTime); String avgChartTime = nf.format(1.0 * pTotalChartTime / pCount); System.out.println("Average chart construction time: " + avgChartTime); System.out.println("Max chart construction time: " + pMaxChartTime); String avgUnpackingTime = nf.format(1.0 * pTotalUnpackingTime / pCount); System.out.println("Average unpacking time: " + avgUnpackingTime); System.out.println("Max unpacking time: " + pMaxUnpackingTime); System.out.println("Supertagger beta tallies:"); Set betas = pBetaTallies.keySet(); for (double beta : betas) { int tally = pBetaTallies.get(beta); System.out.println(beta + "\t" + tally); } String avgF = nf.format(100.0 * totalF / pCount); System.out.println("Labeled f-score: " + avgF); String avgRecall = nf.format(100.0 * totalRecall / pCount); System.out.println("Labeled recall: " + avgRecall); String avgPrecision = nf.format(100.0 * totalPrecision / pCount); System.out.println("Labeled precision: " + avgPrecision); String avgDepsF = nf.format(100.0 * totalDepsF / pCount); System.out.println("Labeled f-score deps only: " + avgDepsF); String avgDepsRecall = nf.format(100.0 * totalDepsRecall / pCount); System.out.println("Labeled recall deps only: " + avgDepsRecall); String avgDepsPrecision = nf.format(100.0 * totalDepsPrecision / pCount); System.out.println("Labeled precision deps only: " + avgDepsPrecision); String avgUnlabeledDepsF = nf.format(100.0 * totalUnlabeledDepsF / pCount); System.out.println("Unlabeled deps f-score: " + 
avgUnlabeledDepsF); String avgUnlabeledDepsRecall = nf.format(100.0 * totalUnlabeledDepsRecall / pCount); System.out.println("Unlabeled deps recall: " + avgUnlabeledDepsRecall); String avgUnlabeledDepsPrecision = nf.format(100.0 * totalUnlabeledDepsPrecision / pCount); System.out.println("Unlabeled deps precision: " + avgUnlabeledDepsPrecision); String avgFComplete = nf.format(100.0 * totalFComplete / pCompleteCount); System.out.println("Labeled f-score for complete parses: " + avgFComplete); String avgRecallComplete = nf.format(100.0 * totalRecallComplete / pCompleteCount); System.out.println("Labeled recall for complete parses: " + avgRecallComplete); String avgPrecisionComplete = nf.format(100.0 * totalPrecisionComplete / pCompleteCount); System.out.println("Labeled precision for complete parses: " + avgPrecisionComplete); String avgDepsFComplete = nf.format(100.0 * totalDepsFComplete / pCompleteCount); System.out.println("Labeled f-score deps only for complete parses: " + avgDepsFComplete); String avgDepsRecallComplete = nf.format(100.0 * totalDepsRecallComplete / pCompleteCount); System.out.println("Labeled recall deps only for complete parses: " + avgDepsRecallComplete); String avgDepsPrecisionComplete = nf.format(100.0 * totalDepsPrecisionComplete / pCompleteCount); System.out.println("Labeled precision deps only for complete parses: " + avgDepsPrecisionComplete); String avgUnlabeledDepsFComplete = nf.format(100.0 * totalUnlabeledDepsFComplete / pCompleteCount); System.out.println("Unlabeled deps f-score for complete parses: " + avgUnlabeledDepsFComplete); String avgUnlabeledDepsRecallComplete = nf.format(100.0 * totalUnlabeledDepsRecallComplete / pCompleteCount); System.out.println("Unlabeled deps recall for complete parses: " + avgUnlabeledDepsRecallComplete); String avgUnlabeledDepsPrecisionComplete = nf.format(100.0 * totalUnlabeledDepsPrecisionComplete / pCompleteCount); System.out.println("Unlabeled deps precision for complete parses: " + avgUnlabeledDepsPrecisionComplete); if (oracleBetter > 0) System.out.println("Oracle better: " + oracleBetter); if (goldMissing > 0) System.out.println("Gold missing: " + goldMissing); System.out.println(); } /** Shows the various realization totals. */ public void showStats() { int rCompleteCount = rCount - rBadCount; String rComplete = "" + rCompleteCount; String rCompletePct = "" + nf.format(100.0 * rCompleteCount / rCount) + "%"; System.out.println("Strings realized completely (in fragments): " + rComplete + " (" + rBadCount + ") " + rCompletePct); String rInexact = "" + (rCount - rExactCount); String rExactPct = "" + nf.format(100.0 * rExactCount / rCount) + "%"; System.out.println("Strings realized exactly (inexactly): " + rExactCount + " (" + rInexact + ") " + rExactPct); System.out.println("Strings where realization finished: " + rDoneCount); String avgScore = nf.format(totalScore / rCount); System.out.println("Avg score: " + avgScore); String avgScoreComplete = nf.format(totalScoreComplete / rCompleteCount); System.out.println("Avg score for complete realizations: " + avgScoreComplete); String meanReciprocalRank = nf.format(totalReciprocalRank / rCount); System.out.println("Mean reciprocal rank: " + meanReciprocalRank); String residualMRR = (rCount == rExactCount) ? 
"n/a" : nf.format((totalReciprocalRank - rExactCount) / (rCount - rExactCount)); System.out.println("Residual mean reciprocal rank: " + residualMRR); String avgNodes = nf.format(totalNominals * 1.0 / rCount); String avgTokens = nf.format(totalTokens * 1.0 / rCount); System.out.println("Avg num nodes, words: " + avgNodes + ", " + avgTokens); System.out.println("Num words (min-max): " + minTokens + "-" + maxTokens); String avgRuleApps = nf.format(totalRuleApps * 1.0 / rCount); System.out.println("Avg num rule apps: " + avgRuleApps); String avgEdges = nf.format(totalEdges * 1.0 / rCount); String avgEdgesCreated = nf.format(totalEdgesCreated * 1.0 / rCount); String avgUnprunedEdges = nf.format(totalUnprunedEdges * 1.0 / rCount); System.out.println("Avg num edges in chart: " + avgEdges); System.out.println("Avg num edges created: " + avgEdgesCreated); System.out.println("Avg num unpruned edges: " + avgUnprunedEdges); String avgRemoved = nf.format(totalPrunedRemoved * 1.0 / rCount); String avgNeverAdded = nf.format(totalPrunedNeverAdded * 1.0 / rCount); System.out.println("Avg num pruned edges removed, never added: " + avgRemoved + ", " + avgNeverAdded); String avgCellMax = nf.format(totalCellMax * 1.0 / rCount); System.out.println("Avg cell max: " + avgCellMax); String avgNewBest = nf.format(totalNewBest * 1.0 / rCount); System.out.println("Total, avg num new best realizations: " + totalNewBest + ", " + avgNewBest); String avgLex = nf.format(lexMap.mean()); String stdLex = nf.format(lexMap.sigma()); System.out.println("Avg (std) time 'til lex lookup finished: " + avgLex + " (" + stdLex + ")"); System.out.println("Max time 'til lex lookup finished: " + maxLex + " (" + maxLexStr + ")"); String avgFirst = nf.format(firstMap.mean()); String stdFirst = nf.format(firstMap.sigma()); System.out.println("Avg (std) time 'til first realization: " + avgFirst + " (" + stdFirst + ")"); System.out.println("Max time 'til first realization: " + maxFirst + " (" + maxFirstStr + ")"); String avgBest = nf.format(bestMap.mean()); String stdBest = nf.format(bestMap.sigma()); System.out.println("Avg (std) time 'til best realization: " + avgBest + " (" + stdBest + ")"); System.out.println("Max time 'til best realization: " + maxBest + " (" + maxBestStr +")"); System.out.println("Max time 'til new best realization: " + maxNewBest + " (" + maxNewBestStr +")"); String avgPacked = nf.format(totalPacked / rCount); System.out.println("Avg time 'til done packing: " + avgPacked); System.out.println("Max time 'til done packing: " + maxPacked + " (" + maxPackedStr +")"); String avgStoppedOrDone = nf.format(allMap.mean()); String stdStoppedOrDone = nf.format(allMap.sigma()); System.out.println("Avg (std) time 'til stopped/done with realizations: " + avgStoppedOrDone + " (" + stdStoppedOrDone + ")"); System.out.println("Max time 'til stopped/done with realizations: " + maxStoppedOrDone + " (" + maxStoppedOrDoneStr +")"); if (oracleBetter > 0) System.out.println("Oracle better: " + oracleBetter); if (goldMissing > 0) System.out.println("Gold missing: " + goldMissing); if (statsfile != null) { Document doc = new Document(); Element root = new Element("rstats"); doc.setRootElement(root); Element counts = new Element("counts"); root.addContent(counts); counts.setAttribute("realized", "" + rCount); counts.setAttribute("complete", "" + rComplete); counts.setAttribute("fragments", "" + rBadCount); counts.setAttribute("exact", "" + rExactCount); counts.setAttribute("inexact", rInexact); counts.setAttribute("finished", "" + rDoneCount); 
Element overall = new Element("overall"); root.addContent(overall); overall.setAttribute("avg-score", avgScore); overall.setAttribute("mean-reciprocal-rank", meanReciprocalRank); overall.setAttribute("residual-mrr", residualMRR); overall.setAttribute("avg-nodes", avgNodes); overall.setAttribute("avg-words", avgTokens); overall.setAttribute("min-words", "" + minTokens); overall.setAttribute("max-words", "" + maxTokens); Element rules = new Element("rules"); root.addContent(rules); rules.setAttribute("avg-apps", avgRuleApps); Element edges = new Element("edges"); root.addContent(edges); edges.setAttribute("avg", avgEdges); edges.setAttribute("avg-unpruned", avgUnprunedEdges); edges.setAttribute("avg-removed", avgRemoved); edges.setAttribute("avg-never-added", avgNeverAdded); edges.setAttribute("avg-cell-max", avgCellMax); if (oracleBetter > 0) edges.setAttribute("oracle-better", "" + oracleBetter); if (goldMissing > 0) edges.setAttribute("gold-missing", "" + goldMissing); Element newBest = new Element("new-best"); root.addContent(newBest); newBest.setAttribute("total", "" + totalNewBest); newBest.setAttribute("avg", avgNewBest); Element times = new Element("times-summary"); root.addContent(times); times.setAttribute("avg-lex", avgLex); times.setAttribute("std-lex", stdLex); times.setAttribute("avg-first", avgFirst); times.setAttribute("std-first", stdFirst); times.setAttribute("max-first", "" + maxFirst); times.setAttribute("avg-best", avgBest); times.setAttribute("std-best", stdBest); times.setAttribute("max-best", "" + maxBest); times.setAttribute("max-new-best", "" + maxNewBest); times.setAttribute("avg-packed", avgPacked); times.setAttribute("max-packed", "" + maxPacked); times.setAttribute("avg-stopped-or-done", avgStoppedOrDone); times.setAttribute("std-stopped-or-done", stdStoppedOrDone); times.setAttribute("max-stopped-or-done", "" + maxStoppedOrDone); Element strings = new Element("max-strings"); root.addContent(strings); Element lex = new Element("lex"); strings.addContent(lex); lex.addContent(maxLexStr); Element first = new Element("first"); strings.addContent(first); first.addContent(maxFirstStr); Element best = new Element("best"); strings.addContent(best); best.addContent(maxBestStr); Element newBest2 = new Element("new-best"); strings.addContent(newBest2); newBest2.addContent(maxNewBestStr); Element packed = new Element("packed"); strings.addContent(packed); packed.addContent(maxPackedStr); Element stoppedOrDone = new Element("stopped-or-done"); strings.addContent(stoppedOrDone); stoppedOrDone.addContent(maxStoppedOrDoneStr); Element scores = new Element("scores"); root.addContent(scores); for (int i = 0; i < bestActualScores.size(); i++) { Element score = new Element("score"); scores.addContent(score); score.setAttribute("val", bestActualScores.get(i).toString()); score.setAttribute("est", bestEstimatedScores.get(i).toString()); score.setAttribute("rank", itemRanks.get(i).toString()); } firstMap.saveTimes(root); bestMap.saveTimes(root); allMap.saveTimes(root); try { FileOutputStream out = new FileOutputStream(statsfile); grammar.serializeXml(doc, out); out.flush(); } catch (IOException exc) { System.out.println("Unable to write stats to: " + statsfile + " (" + exc + ")"); } } } // show outcome, with wrapping private static void showOutcome(String parseResult, String realizeResult, String starForBadSentence, String str) { showOutcome(parseResult, realizeResult, starForBadSentence, str, null); } // show outcome including best realization private static void showOutcome(String 
parseResult, String realizeResult, String starForBadSentence, String str, String bestRealization) { System.out.print(parseResult + "\t" + realizeResult + "\t"); simpleWrap(starForBadSentence + str); if (bestRealization != null) { System.out.print("\t\t"); simpleWrap("(best: " + bestRealization + ")"); } } // does simple wrapping at TEXTWIDTH private static void simpleWrap(String str) { int TEXTWIDTH = 60; for (int i = 0; i <= (str.length()-1)/TEXTWIDTH; i++) { if (i != 0) { System.out.print("\t\t"); } System.out.println(str.substring(i*TEXTWIDTH, Math.min(i*TEXTWIDTH + TEXTWIDTH, str.length()))); } } // formats to three decimal places private static final NumberFormat nf = initNF(); private static NumberFormat initNF() { NumberFormat f = NumberFormat.getInstance(); f.setMinimumIntegerDigits(1); f.setMinimumFractionDigits(1); f.setMaximumFractionDigits(2); return f; } // formats to three decimal places in scientific notation private static final NumberFormat nfE = initNFE(); private static NumberFormat initNFE() { DecimalFormat f = new DecimalFormat("0.###E0"); return f; } /** Shows realizer settings for current test. */ static void showRealizerSettings() { // get, show prefs Preferences prefs = Preferences.userNodeForPackage(TextCCG.class); boolean useIndexing = prefs.getBoolean(EdgeFactory.USE_INDEXING, true); boolean useChunks = prefs.getBoolean(EdgeFactory.USE_CHUNKS, true); boolean useLicensing = prefs.getBoolean(EdgeFactory.USE_FEATURE_LICENSING, true); boolean useCombos = prefs.getBoolean(opennlp.ccg.realize.Chart.USE_COMBOS, true); boolean usePacking = prefs.getBoolean(opennlp.ccg.realize.Chart.USE_PACKING, false); int timeLimit = prefs.getInt(opennlp.ccg.realize.Chart.TIME_LIMIT, opennlp.ccg.realize.Chart.NO_TIME_LIMIT); double nbTimeLimit = prefs.getDouble(opennlp.ccg.realize.Chart.NEW_BEST_TIME_LIMIT, opennlp.ccg.realize.Chart.NO_TIME_LIMIT); int pruningVal = prefs.getInt(opennlp.ccg.realize.Chart.PRUNING_VALUE, opennlp.ccg.realize.Chart.NO_PRUNING); int cellPruningVal = prefs.getInt(opennlp.ccg.realize.Chart.CELL_PRUNING_VALUE, opennlp.ccg.realize.Chart.NO_PRUNING); String msg = "Timing realization with index filtering " + ((useIndexing) ? "on" : "off") + ", "; msg += "chunks " + ((useChunks) ? "on" : "off") + ", "; msg += "licensing " + ((useLicensing) ? "on" : "off") + ", "; if (usePacking) msg += "packing on, "; else { msg += "combos " + ((useCombos) ? "on" : "off") + ", "; if (timeLimit == opennlp.ccg.realize.Chart.NO_TIME_LIMIT) msg += "no time limit, "; else msg += "a time limit of " + timeLimit + " ms, "; if (nbTimeLimit == opennlp.ccg.realize.Chart.NO_TIME_LIMIT) msg += "no new best time limit, "; else { msg += "a new best time limit of "; if (nbTimeLimit >= 1) msg += ((int)nbTimeLimit) + " ms, "; else msg += nbTimeLimit + " of first, "; } } if (pruningVal == opennlp.ccg.realize.Chart.NO_PRUNING) msg += "no pruning, "; else msg += "a pruning value of " + pruningVal + ", "; msg += "and "; if (cellPruningVal == opennlp.ccg.realize.Chart.NO_PRUNING) msg += "no cell pruning"; else msg += "a cell pruning value of " + cellPruningVal; System.out.println(msg); System.out.println(); } /** * Writes the target strings from the given testbed to the given textfile. */ public void writeTargets(File tbFile, String textfile) throws IOException { writeTargets(tbFile, textfile, false, false, false); } /** * Writes the target strings with semantic class replacement * from the given testbed to the given textfile. 
*/ public void writeTargetsSC(File tbFile, String textfile) throws IOException { writeTargets(tbFile, textfile, true, false, false); } /** * Writes the target strings with all associated factors * from the given testbed to the given textfile. */ public void writeTargetsF(File tbFile, String textfile) throws IOException { writeTargets(tbFile, textfile, false, true, false); } /** * Writes the target strings with all associated factors with semantic class replacement * from the given testbed to the given textfile. */ public void writeTargetsFSC(File tbFile, String textfile) throws IOException { writeTargets(tbFile, textfile, true, true, false); } // writes targets, optionally with sem class replacement or factors, // and optionally reversing the words; ungrammatical options are filtered out private void writeTargets( File tbFile, String filename, boolean semClassReplacement, boolean withFactors, boolean reverse ) throws IOException { // open text file String option = ""; if (withFactors) option = " with factors"; if (semClassReplacement) option += " with semantic class replacement"; if (reverse) option += ", reversed"; System.out.println("Writing text file" + option + ": " + filename); System.out.println(); PrintWriter tOut = new PrintWriter(new BufferedWriter(new FileWriter(filename))); HashSet unique = new HashSet(); Tokenizer tokenizer = grammar.lexicon.tokenizer; // loop through files for (File f : getXMLFiles(tbFile)) { // load testbed System.out.println("Loading testbed from: " + f); RegressionInfo tbInfo = new RegressionInfo(grammar, f); int numItems = tbInfo.numberOfItems(); // do each test item for (int i = 0; i < numItems; i++) { // check even/odd only if (i % 2 == 1 && evenOnly) continue; if (i % 2 == 0 && oddOnly) continue; RegressionInfo.TestItem testItem = tbInfo.getItem(i); // check grammatical if (testItem.numOfParses == 0) continue; String s = testItem.sentence; // get parsed words if doing more than just text List words = null; if (semClassReplacement || withFactors) { // use words from sign or pre-parsed full words if available if (testItem.sign != null) words = testItem.sign.getWords(); else if (testItem.fullWords != null) words = tokenizer.tokenize(testItem.fullWords, true); // otherwise parse else words = grammar.getParsedWords(s); } else words = tokenizer.tokenize(s); // reverse, if apropos if (reverse) { List tmp = words; words = new ArrayList(words.size()); words.add(Word.createWord("")); for (int j = tmp.size()-1; j >= 0; j--) { Word w = tmp.get(j); if (w.getForm() == "" || w.getForm() == "") continue; // skip or words.add(w); } words.add(Word.createWord("")); } // write str, add to unique set String str = (!withFactors) ? 
tokenizer.getOrthography(words, semClassReplacement) : tokenizer.format(words, semClassReplacement); tOut.println(str); unique.add(str); System.out.print("."); // indicate progress } System.out.println(); } tOut.flush(); tOut.close(); System.out.println(); System.out.println("Unique strings: " + unique.size()); System.out.println(); } private void writeDerivationFactors(File tbFile, String filename) throws IOException { // open text file System.out.println("Writing derivation factors file: " + filename); System.out.println(); PrintWriter tOut = new PrintWriter(new BufferedWriter(new FileWriter(filename))); Tokenizer tokenizer = grammar.lexicon.tokenizer; // loop through files for (File f : getXMLFiles(tbFile)) { // load testbed System.out.println("Loading testbed from: " + f); RegressionInfo tbInfo = new RegressionInfo(grammar, f); int numItems = tbInfo.numberOfItems(); // do each test item, using the saved sign for (int i = 0; i < numItems; i++) { RegressionInfo.TestItem testItem = tbInfo.getItem(i); if (testItem.numOfParses == 0) continue; // check grammatical Sign sign = testItem.sign; List factors = GenerativeSyntacticModel.getFactors(sign); for (Word w : factors) { tOut.print(tokenizer.format(w)); tOut.print(" "); } tOut.println(); System.out.print("."); // indicate progress } System.out.println(); } tOut.flush(); tOut.close(); System.out.println(); } /** Command-line routine for regression testing. */ public static void main(String[] args) throws IOException { String usage = "java opennlp.ccg.test.Regression \n" + " (-noparsing) (-norealization) (-even|-odd) (-gc) \n" + " (-nullscorer) (-randomscorer) \n" + " (-depthfirst) (-exactmatches) (-aanfilter ()) \n" + " (-scorer ) \n" + " (-parsescorer ) \n" + " (-extractor ) \n" + " (-ngrampruningstrategy) (-pruningstrategy ) \n" + " (-hypertagger | -htconfig ) (-htgold) \n" + " (-supertagger | -stconfig ) \n" + " (-ngramorder N) (-lm|-lmsc ) \n" + " (-srilm " + Arrays.toString(SRILMNgramModelType.values()) + ")\n"+ " (-flm|-flmsc ) \n" + " (-text|-textsc|-textf|-textfsc ) (-reverse) \n" + " (-derivf ) \n" + " (-2events ) (-includegoldinevents) \n" + " (-2apml ) (-bleu ) \n" + " (-nbestrealfile ) (-nbestnormbleu) (-realserdir ) \n" + " (-nbestincludelfs) \n" + " (-rescorefile ) \n" + " (-nbestparsefile ) \n" + " (-g ) (-s ) (|)"; if (args.length > 0 && args[0].equals("-h")) { System.out.println("Usage: \n\n" + usage); System.exit(0); } // setup Regression tester Regression tester = new Regression(); // args String grammarfile = "grammar.xml"; String regressionfile = "testbed.xml"; boolean depthFirst = false; boolean aanfilter = false; String excfile = null; String scorerClass = null; String parseScorerClass = null; String extractorClass = null; boolean ngrampruningstrategy = false; String pruningStrategyClass = null; String hypertaggerClass = null, htconfig = null; boolean htgold = false; String supertaggerClass = null, stconfig = null; String lmfile = null; String flmfile = null; boolean useSemClasses = false; boolean withFactors = false; boolean reverse = false; String textfile = null; String derivfactorsfile = null; boolean srilm = false; SRILMNgramModelType srilmModelType = SRILMNgramModelType.STANDARD; for (int i = 0; i < args.length; i++) { if (args[i].startsWith("-D")) { String prop = args[i].substring(2); int equalpos = prop.indexOf("="); String key = prop.substring(0, equalpos); String val = prop.substring(equalpos+1); System.setProperty(key, val); continue; } if (args[i].equals("-noparsing")) { tester.doParsing = false; continue; 
} if (args[i].equals("-norealization")) { tester.doRealization = false; continue; } if (args[i].equals("-even")) { tester.evenOnly = true; continue; } if (args[i].equals("-odd")) { tester.oddOnly = true; continue; } if (args[i].equals("-gc")) { tester.doGC = true; continue; } if (args[i].equals("-nullscorer")) { tester.scorer = SignScorer.nullScorer; tester.parseScorer = SignScorer.nullScorer; continue; } if (args[i].equals("-randomscorer")) { tester.scorer = SignScorer.randomScorer; tester.parseScorer = SignScorer.randomScorer; continue; } if (args[i].equals("-depthfirst")) { depthFirst = true; continue; } if (args[i].equals("-exactmatches")) { tester.exactMatches = true; continue; } if (args[i].equals("-aanfilter")) { aanfilter = true; if (i < args.length-1 && args[i+1].charAt(0) != '-') excfile = args[++i]; continue; } if (args[i].equals("-scorer")) { scorerClass = args[++i]; continue; } if (args[i].equals("-parsescorer")) { parseScorerClass = args[++i]; continue; } if (args[i].equals("-extractor")) { extractorClass = args[++i]; continue; } if (args[i].equals("-ngrampruningstrategy")) { ngrampruningstrategy = true; continue; } if (args[i].equals("-pruningstrategy")) { pruningStrategyClass = args[++i]; continue; } if (args[i].equals("-hypertagger")) { hypertaggerClass = args[++i]; continue; } if (args[i].equals("-htconfig")) { htconfig = args[++i]; continue; } if (args[i].equals("-htgold")) { htgold = true; continue; } if (args[i].equals("-supertagger")) { supertaggerClass = args[++i]; continue; } if (args[i].equals("-stconfig")) { stconfig = args[++i]; continue; } if (args[i].equals("-ngramorder")) { tester.ngramOrder = Integer.parseInt(args[++i]); continue; } if (args[i].equals("-lm")) { lmfile = args[++i]; continue; } if (args[i].equals("-lmsc")) { lmfile = args[++i]; useSemClasses = true; continue; } if (args[i].equals("-flm")) { flmfile = args[++i]; continue; } if (args[i].equals("-flmsc")) { flmfile = args[++i]; useSemClasses = true; continue; } if (args[i].equals("-reverse")) { reverse = true; continue; } if (args[i].equals("-text")) { textfile = args[++i]; continue; } if (args[i].equals("-textsc")) { textfile = args[++i]; useSemClasses = true; continue; } if (args[i].equals("-textf")) { textfile = args[++i]; withFactors = true; continue; } if (args[i].equals("-textfsc")) { textfile = args[++i]; useSemClasses = true; withFactors = true; continue; } if (args[i].equals("-derivf")) { derivfactorsfile = args[++i]; continue; } if (args[i].equals("-2events")) { tester.eventfile = args[++i]; continue; } if (args[i].equals("-includegoldinevents")) { tester.includeGoldInEvents = true; continue; } if (args[i].equals("-2apml")) { tester.apmldir = args[++i]; continue; } if (args[i].equals("-bleu")) { tester.bleufileprefix = args[++i]; continue; } if (args[i].equals("-nbestrealfile")) { tester.nbestrealfile = args[++i]; continue; } if (args[i].equals("-nbestnormbleu")) { tester.nbestnormbleu = true; continue; } if (args[i].equals("-realserdir")) { tester.realserdir = args[++i]; continue; } if (args[i].equals("-nbestincludelfs")) { tester.nbestincludelfs = true; continue; } if (args[i].equals("-rescorefile")) { tester.rescorefile = args[++i]; continue; } if (args[i].equals("-nbestparsefile")) { tester.nbestparsefile = args[++i]; continue; } if (args[i].equals("-g")) { grammarfile = args[++i]; continue; } if (args[i].equals("-s")) { tester.statsfile = args[++i]; continue; } if (args[i].equals("-srilm")) { srilm = true; if(i < (args.length - 1)) { String type = args[i + 1]; try { srilmModelType = 
SRILMNgramModelType.valueOf(type); i++; } catch(IllegalArgumentException iae) { srilmModelType = SRILMNgramModelType.STANDARD; System.err.println( "Warning: unknown SRILM n-gram model type " + type + " specified, using default (" + srilmModelType + ")"); } } continue; } regressionfile = args[i]; } // load grammar URL grammarURL = new File(grammarfile).toURI().toURL(); System.out.println("Loading grammar from URL: " + grammarURL); tester.grammar = new Grammar(grammarURL); System.out.println(); // with -aanfilter (<exceptions file>) option, set up the a/an filter (nb: exact construction assumed) AAnFilter aanFilter = (!aanfilter) ? null : (excfile != null) ? new AAnFilter(excfile) : new AAnFilter(); // with -lm|-lmsc options, load n-gram model if (lmfile != null) { int order = (tester.ngramOrder > 0) ? tester.ngramOrder : 3; String reversedStr = (reverse) ? "reversed " : ""; System.out.println("Loading " + reversedStr + order + "-gram model from file: " + lmfile); NgramScorer lmScorer = (srilm) ? new SRILMNgramModel(order, new File(lmfile), useSemClasses, srilmModelType) : new StandardNgramModel(order, lmfile, useSemClasses); if (reverse) lmScorer.setReverse(true); if (aanfilter) lmScorer.addFilter(aanFilter); tester.scorer = lmScorer; System.out.println(); } // with -flm|-flmsc options, load factored n-gram model family if (flmfile != null) { String reversedStr = (reverse) ? "reversed " : ""; System.out.println("Loading " + reversedStr + "factored n-gram model family from file: " + flmfile); NgramScorer flmScorer = new FactoredNgramModelFamily(flmfile, useSemClasses); if (reverse) flmScorer.setReverse(true); if (aanfilter) flmScorer.addFilter(aanFilter); tester.scorer = flmScorer; tester.ngramOrder = flmScorer.getOrder(); System.out.println(); } // with -text|-textsc|-textf|-textfsc options, just write text file and exit if (textfile != null) { File tbFile = new File(regressionfile); tester.writeTargets(tbFile, textfile, useSemClasses, withFactors, reverse); System.exit(0); } // with -derivf option, just write derivation factors file and exit if (derivfactorsfile != null) { File tbFile = new File(regressionfile); tester.writeDerivationFactors(tbFile, derivfactorsfile); System.exit(0); } // setup parser if (tester.doParsing) { tester.parser = new Parser(tester.grammar); // instantiate scorer, if any if (parseScorerClass != null) { try { System.out.println("Instantiating parsing sign scorer from class: " + parseScorerClass); tester.parseScorer = (SignScorer) Class.forName(parseScorerClass).newInstance(); tester.showParseStats = true; // turn parsing stats on System.out.println(); } catch (Exception exc) { throw (RuntimeException) new RuntimeException().initCause(exc); } } // set parser scorer, if any if (tester.parseScorer != null) tester.parser.setSignScorer(tester.parseScorer); // also turn on parse stats if doing n-best output if (tester.nbestparsefile != null) tester.showParseStats = true; // instantiate supertagger, if any if (supertaggerClass != null || stconfig != null) { try { Supertagger supertagger; if (supertaggerClass != null) { System.out.println("Instantiating supertagger from class: " + supertaggerClass); supertagger = (Supertagger) Class.forName(supertaggerClass).newInstance(); } else { System.out.println("Instantiating supertagger from config file: " + stconfig); supertagger = WordAndPOSDictionaryLabellingStrategy.supertaggerFactory(stconfig); } tester.parser.setSupertagger(supertagger); if (tester.eventfile != null) { supertagger.setIncludeGold(true); // use gold tags during training tester.parser.setSupertaggerMostToLeastRestrictiveDirection(false); // reverse direction to start with least restrictive setting } System.out.println(); } catch (Exception exc) { throw (RuntimeException) new RuntimeException().initCause(exc); } } } // setup realizer, show
settings if (tester.doRealization) { tester.realizer = new Realizer(tester.grammar); tester.realizer.depthFirst = depthFirst; // instantiate pruning strategy, if any if (ngrampruningstrategy) { int order = (tester.ngramOrder > 0) ? tester.ngramOrder : 3; System.out.println("Instantiating n-gram diversity pruning strategy with order " + order); tester.realizer.pruningStrategy = new NgramDiversityPruningStrategy(order); System.out.println(); } if (pruningStrategyClass != null) { try { System.out.println("Instantiating pruning strategy from class: " + pruningStrategyClass); tester.realizer.pruningStrategy = (PruningStrategy) Class.forName(pruningStrategyClass).newInstance(); System.out.println(); } catch (Exception exc) { throw (RuntimeException) new RuntimeException().initCause(exc); } } if (hypertaggerClass != null || htconfig != null) { try { Hypertagger hypertagger; if (hypertaggerClass != null) { System.out.println("Instantiating hypertagger from class: " + hypertaggerClass); hypertagger = (Hypertagger) Class.forName(hypertaggerClass).newInstance(); } else { System.out.println("Instantiating hypertagger from config file: " + htconfig); hypertagger = ZLMaxentHypertagger.ZLMaxentHypertaggerFactory(htconfig); } tester.realizer.hypertagger = hypertagger; if (tester.eventfile != null) { hypertagger.setIncludeGold(true); // use gold tags during training // NB: could investigate most-to-least-restrictive direction } if (htgold) hypertagger.setIncludeGold(true); // use gold tags, eg for paraphrasing System.out.println(); } catch (Exception exc) { throw (RuntimeException) new RuntimeException().initCause(exc); } } showRealizerSettings(); } // ensure dir for event file exists; // set up feature extractor if (tester.eventfile != null) { File tmp = new File(tester.eventfile); File tmpParent = tmp.getParentFile(); if (tmpParent != null) tmpParent.mkdirs(); System.out.println("Writing event file to: " + tester.eventfile); System.out.println(); } // instantiate feature extractor, if generating events if (tester.eventfile != null) { // ensure just doing parsing or realization if (tester.doParsing && tester.doRealization) { throw new RuntimeException("Events can't be generated for parsing and realization at the same time."); } FeatureExtractor extractor = null; if (extractorClass != null) { try { System.out.println("Instantiating feature extractor from class: " + extractorClass); extractor = (FeatureExtractor) Class.forName(extractorClass).newInstance(); tester.featureExtractor = extractor; System.out.println(); } catch (Exception exc) { throw (RuntimeException) new RuntimeException().initCause(exc); } } // use or combine with scorer, if it's also a feature extractor if (tester.scorer instanceof FeatureExtractor) { if (extractor != null) tester.featureExtractor = new ComposedFeatureExtractor( new FeatureExtractor[] { (FeatureExtractor)tester.scorer, extractor } ); else tester.featureExtractor = (FeatureExtractor) tester.scorer; } else if (tester.parseScorer instanceof FeatureExtractor) { if (extractor != null) tester.featureExtractor = new ComposedFeatureExtractor( new FeatureExtractor[] { (FeatureExtractor)tester.parseScorer, extractor } ); else tester.featureExtractor = (FeatureExtractor) tester.parseScorer; } // otherwise use an n-gram precision model if (tester.featureExtractor == null) tester.featureExtractor = new NgramPrecisionModel(new String[]{""}, true); // set new alphabet tester.featureExtractor.setAlphabet(new Alphabet(10000)); } // ensure apmldir exists if (tester.apmldir != null) { File 
apmlDir = new File(tester.apmldir); if (!apmlDir.exists()) { apmlDir.mkdirs(); } System.out.println("Writing APML files to dir: " + tester.apmldir); System.out.println(); } // ensure dir for bleu files exists if (tester.bleufileprefix != null) { File tmp = new File(tester.bleufileprefix + "-gen.sgm"); File tmpParent = tmp.getParentFile(); if (tmpParent != null) tmpParent.mkdirs(); System.out.println("Writing BLEU files to: " + tester.bleufileprefix + "-*.sgm"); System.out.println(); } // ensure dir for nbestrealfile exists if (tester.nbestrealfile != null) { File tmp = new File(tester.nbestrealfile); File tmpParent = tmp.getParentFile(); if (tmpParent != null) tmpParent.mkdirs(); System.out.println("Writing N-best realizations to: " + tester.nbestrealfile); System.out.println(); } // ensure realserdir exists if (tester.realserdir != null) { File realserDir = new File(tester.realserdir); if (!realserDir.exists()) { realserDir.mkdirs(); } System.out.println("Writing best realization serialization files to dir: " + tester.realserdir); System.out.println(); } // ensure dir for rescorefile exists if (tester.rescorefile != null) { File tmp = new File(tester.rescorefile); File tmpParent = tmp.getParentFile(); if (tmpParent != null) tmpParent.mkdirs(); System.out.println("Writing rescored sign scores to: " + tester.rescorefile); System.out.println(); } // run test tester.runTest(new File(regressionfile)); } } ================================================ FILE: src/opennlp/ccg/test/RegressionInfo.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-4 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.test; import opennlp.ccg.grammar.Grammar; import opennlp.ccg.synsem.*; import org.jdom.*; import org.jdom.input.*; import java.io.*; import java.util.*; /** * Manages the info in a regression test file. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.16 $, $Date: 2011/08/27 19:27:01 $ */ public class RegressionInfo { // the grammar private Grammar grammar; // the test items private TestItem[] testItems; /** Test item. */ public class TestItem { /** The test sentence/phrase. */ public String sentence; /** An alternative paraphrase to target, or null if none. */ public String alt = null; /** The desired number of parses. */ public int numOfParses = 1; /** Whether the sentence/phrase is known to fail to parse. */ public boolean knownFailure = false; /** The full words for the sentence/phrase, or null if none, formatted by the configured tokenizer. */ public String fullWords = null; /** The LF, in XML, for the sentence/phrase, or null if none. 
*/ public Element lfElt = null; /** Any additionally id info, or null if none. */ public String info = null; /** The gold std nominal id name & supertag for LF predicates. @deprecated Should use fullWords. */ public String predInfo = null; /** The gold standard derivation. */ public Sign sign = null; /** Returns the id from info, without prefixed "ID=" if present. */ public String getId() { if (info == null) return null; int pos = info.indexOf('='); return (pos < 0) ? info : info.substring(pos+1); } } /** Reads in the given regression test file and corresponding .ser file, if any. */ public RegressionInfo(Grammar grammar, File regressionFile) throws FileNotFoundException { this(grammar, new FileInputStream(regressionFile), serStream(regressionFile)); } /** Reads in a regression test from the given input stream and object input stream. */ @SuppressWarnings("unchecked") public RegressionInfo(Grammar grammar, InputStream istr, ObjectInputStream serStream) { this.grammar = grammar; SAXBuilder builder = new SAXBuilder(); try { Map signMap = readSerStream(serStream); Document doc = builder.build(istr); Element root = doc.getRootElement(); List items = root.getChildren("item"); testItems = new TestItem[items.size()]; for (int i = 0; i < items.size(); i++) { Element item = (Element) items.get(i); TestItem testItem = new TestItem(); testItems[i] = testItem; testItem.sentence = item.getAttributeValue("string"); testItem.alt = item.getAttributeValue("alt"); testItem.numOfParses = Integer.parseInt(item.getAttributeValue("numOfParses")); testItem.knownFailure = ("true".equals(item.getAttributeValue("known"))) ? true : false; Element fullWordsElt = item.getChild("full-words"); if (fullWordsElt != null) testItem.fullWords = fullWordsElt.getTextNormalize(); testItem.lfElt = item.getChild("lf"); testItem.info = item.getAttributeValue("info"); Element predInfoElt = item.getChild("pred-info"); if (predInfoElt != null) testItem.predInfo = predInfoElt.getAttributeValue("data"); if (signMap != null && testItem.info != null) testItem.sign = signMap.get(testItem.info); } } catch (Exception e) { throw (RuntimeException) new RuntimeException().initCause(e); } } /** Returns the corresponding .ser file for loading sign objects. */ public static File serFile(File regressionFile) { String name = regressionFile.getName(); String prefix = name.substring(0, name.lastIndexOf('.')); return new File(regressionFile.getParentFile(), prefix + ".ser"); } /** Returns object input stream for corresponding .ser file, or null if none. */ public static ObjectInputStream serStream(File regressionFile) { File serFile = serFile(regressionFile); if (serFile.exists()) { try { return new ObjectInputStream(new FileInputStream(serFile)); } catch (FileNotFoundException e) { throw (RuntimeException) new RuntimeException().initCause(e); } catch (IOException e) { throw (RuntimeException) new RuntimeException().initCause(e); } } else return null; } /** Reads in a map of info keys and gold standard signs from the given stream, or returns null if the stream is null. */ @SuppressWarnings("unchecked") public static Map readSerStream(ObjectInputStream serStream) throws IOException { if (serStream == null) return null; try { return (Map) serStream.readObject(); } catch (ClassNotFoundException e) { throw (RuntimeException) new RuntimeException().initCause(e); } } /** Writes the map of info keys and gold standard signs to the corresponding .ser file. 
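 *
 * A minimal sketch of the intended round trip (the sign map contents and testbed path here are
 * hypothetical, for illustration only):
 * <pre>
 * Map signMap = new HashMap();
 * signMap.put("i0", goldSign);  // gold-standard derivation for item "i0"
 * RegressionInfo.writeSerFile(signMap, new File("testbed.xml"));  // saved as testbed.ser
 * Map reloaded = RegressionInfo.readSerStream(RegressionInfo.serStream(new File("testbed.xml")));
 * </pre>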
*/ public static void writeSerFile(Map signMap, File regressionFile) throws FileNotFoundException, IOException { File serFile = serFile(regressionFile); ObjectOutputStream oos = new ObjectOutputStream(new FileOutputStream(serFile)); oos.writeObject(signMap); oos.close(); } /** Returns the number of test items. */ public int numberOfItems() { return testItems.length; } /** Returns the test item with the given index. */ public TestItem getItem(int i) { return testItems[i]; } /** * Makes an XML test item from the given test item object. */ public static Element makeTestItem(TestItem testItem) { Element item = new Element("item"); item.setAttribute("numOfParses", "" + testItem.numOfParses); if (testItem.knownFailure) item.setAttribute("known", "true"); item.setAttribute("string", testItem.sentence); if (testItem.alt != null) item.setAttribute("alt", testItem.alt); if (testItem.fullWords != null) { Element fullWordsElt = new Element("full-words"); item.addContent(fullWordsElt); fullWordsElt.addContent(testItem.fullWords); } if (testItem.lfElt != null) { testItem.lfElt.detach(); item.addContent(testItem.lfElt); } if (testItem.info != null) item.setAttribute("info", testItem.info); return item; } /** * Makes an XML test item with the given string, number of parses and LF, * applying the configured to-XML transformations. */ public Element makeTestItem(String target, int numParses, LF lf) throws IOException { return makeTestItem(grammar, target, numParses, lf); } /** * Makes an XML test item with the given string, number of parses and LF, * applying the configured to-XML transformations. */ public static Element makeTestItem(Grammar grammar, String target, int numParses, LF lf) throws IOException { return makeTestItem(grammar, target, numParses, lf, null); } /** * Makes an XML test item with the given string, number of parses, LF and info attribute, * applying the configured to-XML transformations. */ public static Element makeTestItem(Grammar grammar, String target, int numParses, LF lf, String info) throws IOException { Element item = new Element("item"); item.setAttribute("numOfParses", "" + numParses); item.setAttribute("string", target); if (lf != null) item.addContent(grammar.makeLfElt(lf)); if (info != null) item.setAttribute("info", info); return item; } /** * Adds the given sign with its string, number of parses and converted LF * as a test item to the testbed with the given filename, applying the configured to-XML * transformations. 
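 *
 * For illustration, a typical call (with a hypothetical grammar, gold-standard sign and LF in
 * scope) appends one new item element to the file and records the sign under a fresh id:
 * <pre>
 * RegressionInfo.addToTestbed(grammar, sign, 1, lf, "testbed.xml");
 * </pre>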
*/ public static void addToTestbed(Grammar grammar, Sign sign, int numParses, LF lf, String filename) throws IOException { // ensure dirs exist for filename File file = new File(filename); File parent = file.getParentFile(); if (parent != null && !parent.exists()) { parent.mkdirs(); } // load or make doc Document doc; Element root; boolean newDoc = false; if (file.exists()) { // read XML SAXBuilder builder = new SAXBuilder(); try { doc = builder.build(file); } catch (JDOMException jde) { throw (IOException) new IOException().initCause(jde); } root = doc.getRootElement(); } else { doc = new Document(); root = new Element("regression"); doc.setRootElement(root); newDoc = true; } // load or make sign map Map signMap = readSerStream(serStream(file)); if (signMap == null) signMap = new HashMap(); // find unique id int count = 0; String id = "i" + count; while (signMap.containsKey(id)) id = "i" + ++count; // make test item String target = sign.getOrthography(); Element item = makeTestItem(grammar, target, numParses, lf, id); // append new item if (!newDoc) root.addContent(" "); // nb: for some reason, this gets the indenting right root.addContent(item); // add sign to map signMap.put(id, sign); // save FileOutputStream out = new FileOutputStream(file); grammar.serializeXml(doc, out); out.close(); writeSerFile(signMap, file); } } ================================================ FILE: src/opennlp/ccg/test/ScorerMaker.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.test; import opennlp.ccg.synsem.SignScorer; import java.io.*; /** * Interface for making custom scorers for use in cross-validation tests with the realizer. * * @author Michael White * @version $Revision: 1.6 $, $Date: 2007/12/21 05:13:37 $ */ public interface ScorerMaker { /** * Sets the context for this scorer maker. */ public void setCVR(CrossValidateRealizer cvr); /** * Prepares a scoring model from the training data. * The data can be accessed by creating a RegressionInfo * object from the given training file. * The test data is also made available to optionally * compute perplexity or other measures. * The model can be stored in a file in tmpDir, keyed off of foldNum. */ public void prepScorer(File tmpDir, int foldNum, File trainFile, File testFile) throws IOException; /** * Optionally summarizes perplexity or other measures * after all calls to prepScorer. */ public void prepScorersSummary(File tmpDir) throws IOException; /** * Loads a scoring model created from the training data. 
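 *
 * A skeletal, hypothetical implementation might train a language model in prepScorer and
 * simply reload it here, e.g.:
 * <pre>
 * public SignScorer loadScorer(File tmpDir, int foldNum, File trainFile) throws IOException {
 *     File modelFile = new File(tmpDir, "fold" + foldNum + ".lm");  // written by prepScorer
 *     return new MyFoldScorer(modelFile);  // hypothetical SignScorer implementation
 * }
 * </pre>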
*/ public SignScorer loadScorer(File tmpDir, int foldNum, File trainFile) throws IOException; } ================================================ FILE: src/opennlp/ccg/test/TimingMap.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-4 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.test; import java.util.*; import org.jdom.*; /** * Utility class for managing average times per number of nodes. * * @author Michael White * @version $Revision: 1.5 $, $Date: 2009/12/21 04:18:31 $ */ public class TimingMap { private String label; private List<Integer> times = new ArrayList<Integer>(); private HashMap<Integer, List<Integer>> map = new HashMap<Integer, List<Integer>>(); /** Constructor, with label. */ public TimingMap(String label) { this.label = label; } /** Adds a number, time pair. */ public void add(int num, int time) { Integer timeInt = new Integer(time); times.add(timeInt); Integer key = new Integer(num); List<Integer> timesPerNum = map.get(key); if (timesPerNum == null) { timesPerNum = new ArrayList<Integer>(); map.put(key, timesPerNum); } timesPerNum.add(timeInt); } /** Returns the mean time. */ public double mean() { int total = 0; for (int i = 0; i < times.size(); i++) { Integer time = times.get(i); total += time.intValue(); } return (1.0 * total) / times.size(); } /** Returns the standard deviation. */ public double sigma() { if (times.size() < 2) return -1; // NA double mean = mean(); double numerator = 0; for (int i = 0; i < times.size(); i++) { Integer time = times.get(i); numerator += Math.pow(time.intValue() - mean, 2); } int denominator = times.size() - 1; return Math.sqrt(numerator / denominator); } /** Saves the times and times per number (with average) as XML elements under the given one.
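 *
 * A small usage sketch (the times are assumed to be in milliseconds and reportRoot to be the
 * root element of a test report):
 * <pre>
 * TimingMap parseTimes = new TimingMap("parse");
 * parseTimes.add(12, 340);  // 12 nodes, 340 ms
 * parseTimes.add(12, 310);
 * parseTimes.add(20, 905);
 * parseTimes.saveTimes(reportRoot);  // adds a times element with label "parse" under reportRoot
 * </pre>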
*/ public void saveTimes(Element root) { Element timesElt = new Element("times"); root.addContent(timesElt); timesElt.setAttribute("label", label); Element listElt = new Element("list"); timesElt.addContent(listElt); listElt.setAttribute("mean", "" + mean()); listElt.setAttribute("sigma", "" + sigma()); for (int i = 0; i < times.size(); i++) { Element timeElt = new Element("time"); listElt.addContent(timeElt); timeElt.setAttribute("val", times.get(i).toString()); } Element perNumsElt = new Element("per-nums"); timesElt.addContent(perNumsElt); Set keys = map.keySet(); List nums = new ArrayList(keys.size()); nums.addAll(keys); Collections.sort(nums); int min = nums.get(0).intValue(); int max = nums.get(nums.size()-1).intValue(); for (int num = min; num <= max; num++) { Element perNumElt = new Element("per"); perNumsElt.addContent(perNumElt); perNumElt.setAttribute("num", "" + num); Integer numKey = new Integer(num); List timesPer = map.get(numKey); if (timesPer == null) { perNumElt.setAttribute("count", "0"); continue; } int sum = 0; int count = timesPer.size(); perNumElt.setAttribute("count", "" + count); for (int i = 0; i < timesPer.size(); i++) { Integer time = (Integer) timesPer.get(i); sum += time.intValue(); Element timeElt = new Element("time"); perNumElt.addContent(timeElt); timeElt.setAttribute("val", time.toString()); } double mean = (sum * 1.0) / count; perNumElt.setAttribute("mean", "" + mean); } } } ================================================ FILE: src/opennlp/ccg/test/UpdateTestbed.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.test; import opennlp.ccg.grammar.*; import opennlp.ccg.lexicon.*; import org.jdom.*; import java.io.*; import java.net.*; import java.util.*; /** * Utility class to update testbed files; just adds full words based on * sign or parse at present. * * @author Michael White * @version $Revision: 1.5 $, $Date: 2009/12/21 04:18:31 $ */ public class UpdateTestbed { /** The grammar. */ private Grammar grammar; /** Constructor. */ private UpdateTestbed(URL grammarURL) throws IOException { // load grammar System.out.println("Loading grammar from URL: " + grammarURL); grammar = new Grammar(grammarURL); } /** Adds full words for each test item, if missing, based on the sign or parse. 
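 *
 * This corresponds to running the updater from the command line, e.g.:
 * <pre>
 * java opennlp.ccg.test.UpdateTestbed -g grammar.xml -add-full-words testbed.xml
 * </pre>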
*/ private void addFullWords(File tbFile) throws IOException { // load testbed System.out.println("Loading testbed from: " + tbFile); RegressionInfo tbInfo = new RegressionInfo(grammar, tbFile); // create output doc Document outDoc = new Document(); Element outRoot = new Element("regression"); outDoc.setRootElement(outRoot); // update each one int numItems = tbInfo.numberOfItems(); Tokenizer tokenizer = grammar.lexicon.tokenizer; System.out.print("Adding full words "); for (int i = 0; i < numItems; i++) { RegressionInfo.TestItem testItem = tbInfo.getItem(i); if (testItem.fullWords == null) { List words = (testItem.sign != null) ? testItem.sign.getWords() : grammar.getParsedWords(testItem.sentence); testItem.fullWords = tokenizer.format(words); } outRoot.addContent(RegressionInfo.makeTestItem(testItem)); System.out.print("."); // indicate progress } System.out.println(); // save file, backing up original File tbFileBackup = new File(tbFile.getParentFile(), tbFile.getName() + "~"); System.out.println("Backing up testbed to: " + tbFileBackup); tbFile.renameTo(tbFileBackup); System.out.println("Saving results to: " + tbFile); FileOutputStream out = new FileOutputStream(tbFile); grammar.serializeXml(outDoc, out); out.close(); } /** Updates the given input file. */ public static void main(String[] args) throws IOException { String usage = "Usage: java opennlp.ccg.test.UpdateTestbed (-g ) (-add-full-words) ()"; if (args.length > 0 && args[0].equals("-h")) { System.out.println(usage); System.exit(0); } // args String grammarfile = "grammar.xml"; String testbedfile = "testbed.xml"; boolean addFullWords = false; for (int i = 0; i < args.length; i++) { if (args[i].equals("-g")) { grammarfile = args[++i]; continue; } if (args[i].equals("-add-full-words")) { addFullWords = true; continue; } testbedfile = args[i]; } // create updater, check testbed exists File gFile = new File(grammarfile); URL grammarURL = gFile.toURI().toURL(); File tbFile = new File(testbedfile); if (!tbFile.exists()) { tbFile = new File(gFile.getParentFile(), testbedfile); } if (!tbFile.exists()) { System.out.println("Unable to find testbed file: " + testbedfile); System.exit(-1); } UpdateTestbed updater = new UpdateTestbed(grammarURL); // do tasks if (addFullWords) updater.addFullWords(tbFile); System.out.println("Done."); } } ================================================ FILE: src/opennlp/ccg/test/Validator.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.test; // import javax.xml.parsers.*; import org.xml.sax.*; import org.xml.sax.helpers.*; // import java.net.*; /** * Validates XML files against their declared schemas. * * @author Michael White * @version $Revision: 1.4 $, $Date: 2005/10/20 18:49:42 $ */ public class Validator { public static void main(String[] args) throws Exception { if (args.length == 0) { System.out.println("Usage: java opennlp.ccg.test.Validator "); System.exit(1); } // configure schema validating XML parser XMLReader parser = getXercesSchemaValidatingParser(); // parse for (int i = 0; i < args.length; i++) { // System.out.println("Parsing: " + args[i]); parser.parse(args[i]); } } // NB: this requires xercesImpl.jar, but on the other hand it does not seem // possible to validate with the version of JAXP that comes with JDK 1.4.1 // (cf. JAXP sample SAXLocalNameCount.java) private static XMLReader getXercesSchemaValidatingParser() throws Exception { String DEFAULT_PARSER_NAME = "org.apache.xerces.parsers.SAXParser"; XMLReader parser = XMLReaderFactory.createXMLReader(DEFAULT_PARSER_NAME); String VALIDATION_FEATURE_ID = "http://xml.org/sax/features/validation"; String SCHEMA_VALIDATION_FEATURE_ID = "http://apache.org/xml/features/validation/schema"; parser.setFeature(VALIDATION_FEATURE_ID, true); parser.setFeature(SCHEMA_VALIDATION_FEATURE_ID, true); return parser; } } ================================================ FILE: src/opennlp/ccg/unify/EmptySubstitution.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002 Jason Baldridge // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.unify; import java.util.Iterator; /** * A Substitution which does not hold any substitutions. * * @author Jason Baldridge * @version $Revision: 1.2 $, $Date: 2005/10/20 17:30:30 $ */ public class EmptySubstitution implements Substitution { public Object makeSubstitution(Variable var, Object u) throws UnifyFailure { return u; } public Object getValue(Variable var) { return null; } public Iterator varIterator() { return null; } } ================================================ FILE: src/opennlp/ccg/unify/Feature.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002 Jason Baldridge and Gann Bierner // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. 
// // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.unify; /** * An attribute paired with a value, possibly with an index that ties * it to another feature. * * @author Jason Baldridge * @version $Revision: 1.1.1.1 $, $Date: 2003/02/28 18:02:13 $ **/ public interface Feature { public String getAttribute (); public Unifiable getValue (); public short getIndex (); public void setValue (Unifiable u); public void setIndex (short index); } ================================================ FILE: src/opennlp/ccg/unify/FeatureStructure.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-5 Jason Baldridge, Gann Bierner and // University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.unify; import java.util.Set; /** * A feature structure containing attributes and their associated values. * * @author Jason Baldridge * @author Gann Bierner * @author Michael White * @version $Revision: 1.5 $, $Date: 2009/02/16 17:31:38 $ */ public interface FeatureStructure extends Unifiable, Mutable { /** * Store a attribute/value pair * * @param attribute the attribute of the feature * @param value the value of the feature */ public void setFeature(String attribute, Object value); /** * Get the value corresponding to an attribute. * * @param attribute the attribute of the feature * @return the value of the feature */ public Object getValue(String attribute); /** * Checks to see if the feature structure contains a feature with * the given attribute. 
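 *
 * For illustration, with the GFeatStruc implementation below (the feature name and value are
 * chosen arbitrarily for the example):
 * <pre>
 * FeatureStructure fs = new GFeatStruc();
 * fs.setFeature("num", Grammar.theGrammar.types.getSimpleType("sg"));
 * fs.hasAttribute("num");   // true
 * fs.hasAttribute("pers");  // false
 * </pre>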
* * @param attribute the attribute * @return if this structure contains that attribute */ public boolean hasAttribute(String attribute); /** * Checks to see if an attribute has a particular value in this structure * * @param attribute the attribute * @param value the value * @return if this structure contains that attribute/value pair */ public boolean attributeHasValue(String attribute, Object value); /** * The all attributes in set form * * @return the set of attributes */ public Set getAttributes(); /** * The number of features in this feature structure * * @return number of features in this feature structure */ public int size(); /** * Returns whether or not this feature structure contains any features * * @return whether this feature structure contains any features */ public boolean isEmpty(); /** * Explictly clear the attribute value mappings in this feature structure * * @param b the empty value */ public void clear(); /** * Makes a deep copy of this feature structure. * * @return a copy of this feature structure */ public FeatureStructure copy(); /** * Computes whether this feature structure contains (is a superset * of) another feature structure. * * @param fs the possibly contained feature structure * @return if that structure is a subset of this one */ public boolean contains(FeatureStructure fs); /** * Changes this feature structure such that all its features that * are in another feature structure are changed to have the values of * the other feature structure. This is destructive. * * @param f the feature structure to inherit from * @return the changed feature structure */ public FeatureStructure inherit(FeatureStructure fs); /** * Determines if this feature structure is exactly the same as another. This * means that for every feature, the structures have exactly the same value. * * @param f the other feature structure * @return if this structure is the same as the other */ public boolean equals(FeatureStructure fs); /** Returns the index. */ public int getIndex(); /** Sets the index. */ public void setIndex(int index); /** Returns the inheritsFrom (default unification) index. */ public int getInheritsFrom(); /** * Returns the supertag info for this feature structure. */ public String getSupertagInfo(); /** * Returns a TeX formatted feature structure. */ public String toTeX(); } ================================================ FILE: src/opennlp/ccg/unify/GFeatStruc.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-7 Jason Baldridge, Gann Bierner, Michael White and Gunes Erkan // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.unify; import opennlp.ccg.synsem.LF; import opennlp.ccg.hylo.*; import opennlp.ccg.grammar.*; import gnu.trove.*; import org.jdom.*; import java.util.*; /** * A feature structure for use with CCG categories. * * @author Jason Baldridge * @author Gann Bierner * @author Michael White * @author Gunes Erkan * @version $Revision: 1.29 $, $Date: 2011/11/11 15:30:42 $ */ public class GFeatStruc extends HashMap implements FeatureStructure { private static final long serialVersionUID = 1L; boolean _empty = true; int _index = 0; int _inheritsFrom = 0; public GFeatStruc() { super(3); } public GFeatStruc(int i) { super(i); } @SuppressWarnings("unchecked") public GFeatStruc(Element fsEl) { super(fsEl.getChildren().size()); String index = fsEl.getAttributeValue("id"); if (index != null) { _index = Integer.parseInt(index); } String inheritsFrom = fsEl.getAttributeValue("inheritsFrom"); if (inheritsFrom != null) { _inheritsFrom = Integer.parseInt(inheritsFrom); } List feats = fsEl.getChildren(); if (feats.size() == 0) { setFeature(fsEl); } else { for (Iterator featIt=feats.iterator(); featIt.hasNext();) { setFeature((Element)featIt.next()); } } } public Element toXml() { Element retval = new Element("fs"); if (_index > 0) retval.setAttribute("id", Integer.toString(_index)); if (_inheritsFrom > 0) retval.setAttribute("inheritsFrom", Integer.toString(_inheritsFrom)); List keys = new ArrayList(keySet()); Collections.sort(keys); if (size() == 1 && get(keys.get(0)) instanceof SimpleType) { String attr = keys.get(0); SimpleType val = (SimpleType) get(attr); retval.setAttribute("attr", attr); retval.setAttribute("val", val.getName()); } else { for (String attr : keys) { Element featElt = new Element("feat"); featElt.setAttribute("attr", attr); retval.addContent(featElt); Object val = get(attr); if (val instanceof SimpleType) featElt.setAttribute("val", ((SimpleType) val).getName()); else { if (val instanceof GFeatVar) { GFeatVar var = (GFeatVar) val; Element varElt = new Element("featvar"); featElt.addContent(varElt); String name = var.name(); String typeName = var.getType().getName(); if (!typeName.equals(Types.TOP_TYPE)) name += ":" + typeName; varElt.setAttribute("name", name); } else if (val instanceof LF) featElt.addContent(HyloHelper.toXml((LF)val)); else throw new RuntimeException("Unsupported feature value type in constructing XML: " + val); } } } return retval; } public void deepMap(ModFcn mf) { for (Iterator attributes=keySet().iterator(); attributes.hasNext();) { Object val1 = getValue(attributes.next()); if (val1 instanceof Mutable) { ((Mutable)val1).deepMap(mf); } } mf.modify(this); } public void setFeature(String attribute, Object val) { put(attribute, val); _empty = false; } private void setFeature(Element e) { String attr = e.getAttributeValue("attr"); if (attr == null) attr = e.getAttributeValue("a"); if (attr == null) { return; } String val = e.getAttributeValue("val"); if (val == null) val = e.getAttributeValue("v"); Object value; if (val != null) { value = Grammar.theGrammar.types.getSimpleType(val); } else { Element valEl = (Element)e.getChildren().get(0); if (valEl.getName().equals("featvar") || valEl.getName().equals("fvar")) { String[] name = valEl.getAttributeValue("name").split(":"); if (name[0]==null) name = valEl.getAttributeValue("n").split(":",2); if (name.length<2) { value = new GFeatVar(name[0]); } else value = new GFeatVar(name[0], Grammar.theGrammar.types.getSimpleType(name[1])); } 
else { value = HyloHelper.getLF((Element)e.getChildren().get(0)); } } setFeature(attr, value); } public Object getValue(String attribute) { return get(attribute); } public boolean hasAttribute(String attribute) { return containsKey(attribute); } public boolean attributeHasValue(String attribute, Object val) { return val.equals(getValue(attribute)); } public Set<String> getAttributes() { return keySet(); } public void clear() { super.clear(); _empty = true; } /** Returns true iff this feature structure has the same index and set of attr-val pairs. */ public boolean equals(FeatureStructure fs) { if (!(fs instanceof GFeatStruc)) return false; GFeatStruc bfs = (GFeatStruc)fs; if (_index != bfs._index) return false; if (size() != bfs.size()) return false; Set<String> atts1 = getAttributes(); Set<String> atts2 = bfs.getAttributes(); if (!atts1.containsAll(atts2)) return false; for (Iterator<String> it = atts1.iterator(); it.hasNext(); ) { String att = it.next(); if (!getValue(att).equals(bfs.getValue(att))) return false; } return true; } /** Returns a hash code consistent with equals. */ public int hashCode() { return super.hashCode() + _index; } public FeatureStructure copy() { GFeatStruc $fs = new GFeatStruc(size()); $fs.setIndex(_index); $fs._inheritsFrom = _inheritsFrom; for (Iterator<String> i=getAttributes().iterator(); i.hasNext();) { String a = i.next(); $fs.setFeature(a, UnifyControl.copy(getValue(a))); } return $fs; } public boolean contains(FeatureStructure fs) { if (size() < fs.size()) return false; Set<String> atts1 = getAttributes(); Set<String> atts2 = fs.getAttributes(); if (atts1.containsAll(atts2)) { for (Iterator<String> i2 = atts2.iterator(); i2.hasNext();) { String a2 = i2.next(); boolean foundA2 = false; for (Iterator<String> i1 = atts1.iterator(); !foundA2 && i1.hasNext();) { String a1 = i1.next(); if (a1.equals(a2)) { if (!getValue(a1).equals(fs.getValue(a2))) return false; foundA2 = true; } } } return true; } else { return false; } } public boolean occurs(Variable v) { for (Iterator i = values().iterator(); i.hasNext();) { Object $_ = i.next(); if ($_ instanceof Unifiable && ((Unifiable)$_).occurs(v)) return true; } return false; } public void unifyCheck(Object u) throws UnifyFailure { if (!(u instanceof FeatureStructure)) { throw new UnifyFailure(); } // look for incompatible string-valued features FeatureStructure fs2 = (FeatureStructure)u; Set<String> keys1 = getAttributes(); for (Iterator<String> i1=keys1.iterator(); i1.hasNext();) { String k1 = i1.next(); Object val1 = getValue(k1); if (!(val1 instanceof SimpleType)) continue; Object val2 = fs2.getValue(k1); if (!(val2 instanceof SimpleType)) continue; ((SimpleType)val1).unifyCheck(val2); } } public Object unify(Object u, Substitution sub) throws UnifyFailure { if (!(u instanceof FeatureStructure)) { throw new UnifyFailure(); } FeatureStructure fs2 = (FeatureStructure)u; FeatureStructure $fs = new GFeatStruc(size()); Set<String> keys1 = getAttributes(); Set<String> keys2 = fs2.getAttributes(); for (Iterator<String> i1=keys1.iterator(); i1.hasNext();) { String k1 = i1.next(); Object val1 = getValue(k1); Object val2 = fs2.getValue(k1); if (val2 != null) { $fs.setFeature(k1, Unifier.unify(val1, val2, sub)); } else { $fs.setFeature(k1, UnifyControl.copy(val1)); } } for (Iterator<String> i2=keys2.iterator(); i2.hasNext();) { String k2 = i2.next(); if (!keys1.contains(k2)) $fs.setFeature(k2, UnifyControl.copy(fs2.getValue(k2))); } int fs2Index = fs2.getIndex(); int newIndex = 0; if (_index == 0) { newIndex = fs2Index; } else if (fs2Index == 0) { newIndex = _index; } else if (sub instanceof GSubstitution) { newIndex =
((GSubstitution)sub).makeNewIndex(_index, fs2Index); } $fs.setIndex(newIndex); if (sub instanceof GSubstitution && newIndex > 0) { ((GSubstitution)sub).addIndexedObject(newIndex,$fs); } return $fs; } public Object fill(Substitution sub) throws UnifyFailure { FeatureStructure $fs = copy(); for (Iterator i = $fs.getAttributes().iterator(); i.hasNext();) { String a = i.next(); Object value = getValue(a); if (value instanceof Variable) { Object varVal = sub.getValue((Variable)value); if (null != varVal) { $fs.setFeature(a, Unifier.unify(value,varVal,sub)); } } } if (_index > 0 && sub instanceof GSubstitution) { FeatureStructure otherVals = (FeatureStructure)((GSubstitution)sub).getIndexedObject(_index); if (null != otherVals) { if (!$fs.equals(otherVals)) { $fs = (FeatureStructure)$fs.unify(otherVals, sub); $fs.setIndex(otherVals.getIndex()); } } } return $fs; } public FeatureStructure inherit(FeatureStructure fs) { FeatureStructure $fs = copy(); for (Iterator i = fs.getAttributes().iterator(); i.hasNext();) { String a = i.next(); $fs.setFeature(a, UnifyControl.copy(fs.getValue(a))); } return $fs; } public int getIndex() { return _index; } public void setIndex(int index) { _index = index; } public int getInheritsFrom() { return _inheritsFrom; } private void addFeatureString(String attribute, StringBuffer sb) { Object val = getValue(attribute); sb.append(attribute).append('=').append(val.toString()); } public String toString() { // if (_empty) return ""; StringBuffer sb = new StringBuffer(size()*4); if (_index > 0) { sb.append('<'); sb.append(_index); sb.append('>'); } if (_empty) return sb.toString(); String featsToShow = Grammar.theGrammar.prefs.featsToShow; sb.append('{'); List filteredKeys = new ArrayList(size()); if (featsToShow.length() == 0) { filteredKeys.addAll(keySet()); } else { for (Iterator it = keySet().iterator(); it.hasNext(); ) { String key = it.next(); if (featsToShow.indexOf(key) != -1) filteredKeys.add(key); } } String[] keys = new String[filteredKeys.size()]; filteredKeys.toArray(keys); Arrays.sort(keys); for (int i=0; i < keys.length; i++) { addFeatureString(keys[i], sb); if (i < keys.length - 1) sb.append(", "); } sb.append('}'); return sb.toString(); } /** * Returns the supertag info for this feature structure. * In particular, returns the values of any non-variable * features of interest, within square brackets. * The features of interest are configurable * at the grammar level. */ public String getSupertagInfo() { if (_empty) return ""; StringBuffer sb = new StringBuffer(); ArrayList attrs = new ArrayList(getAttributes()); Collections.sort(attrs); Set supertagFeatures = Grammar.theGrammar.supertagFeatures; for (int i = 0; i < attrs.size(); i++) { String attr = attrs.get(i); if (!supertagFeatures.contains(attr)) continue; Object val = getValue(attr); if (val instanceof Variable) continue; String s = val.toString(); if (s.equals("+") || s.equals("-")) s = s + attr; sb.append('[').append(s).append(']'); } return sb.toString(); } private void addFeatureTeX(String attribute, StringBuffer sb) { Object val = getValue(attribute); String s = cleanText(val.toString()); if (s.equals("+") || s.equals("-")) s = attribute + s; sb.append(" ").append(s); } // makes sure every special character is handled correctly in LaTeX private String cleanText(String s) { String str = s; try { //order matters!! 
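// the backslash itself is rewritten first, since all of the later replacements introduce backslashes of their own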
str = str.replaceAll("\\\\", " \\\\\\backslash "); str = str.replaceAll("\\{", " \\\\\\{ "); str = str.replaceAll("\\}", " \\\\\\} "); str = str.replaceAll("\\$", " \\\\\\$ "); str = str.replaceAll("\\#", " \\\\\\# "); str = str.replaceAll("\\%", " \\\\\\% "); str = str.replaceAll("\\&", " \\\\\\& "); str = str.replaceAll("\\~", " \\\\\\tilde\\{\\} "); str = str.replaceAll("\\_", " \\\\\\_ "); str = str.replaceAll("\\^", " \\\\\\hat\\{\\} "); } catch (Exception e) { System.out.println("Error while evaluating RegExp: " + e.toString()); } return str; } public String toTeX() { StringBuffer sb = new StringBuffer(); if ((_index > 0)&&(_empty)) { sb.append(" \\subsf{ < "); sb.append(_index); sb.append(" > } "); } if (_empty) return sb.toString(); String featsToShow = Grammar.theGrammar.prefs.featsToShow; sb.append(" \\subsf{ "); if ((_index > 0)) { sb.append(" < "); sb.append(_index); sb.append(" > "); } List filteredKeys = new ArrayList(size()); if (featsToShow.length() == 0) { filteredKeys.addAll(keySet()); } else { for (Iterator it = keySet().iterator(); it.hasNext(); ) { String key = it.next(); if (featsToShow.indexOf(key) != -1) filteredKeys.add(key); } } String[] keys = new String[filteredKeys.size()]; filteredKeys.toArray(keys); Arrays.sort(keys); for (int i=0; i < keys.length; i++) { addFeatureTeX(keys[i], sb); if (i < keys.length - 1) sb.append(" , "); } sb.append(" } "); return sb.toString(); } /** * Returns a hash code using the given map from vars to ints, * to allow for equivalence up to variable names. */ public int hashCode(TObjectIntHashMap varMap) { int retval = 0; // nb: treat index as a regular var if (_index != 0) { // see if index already in map if (varMap.containsKey(_index)) retval = varMap.get(_index); // otherwise add it else { int next = varMap.size() + 1; varMap.put(_index, next); retval = next; } } // otherwise treat missing index as unique, keyed to negative identity hash else { int next = varMap.size() + 1; varMap.put(-1 * Math.abs(System.identityHashCode(this)), next); retval = next; } if (_empty) { return retval; } // sort keys Set keySet = keySet(); String[] keys = new String[keySet.size()]; keySet.toArray(keys); Arrays.sort(keys); // do each key for (int i=0; i atts1 = getAttributes(); Set atts2 = fs.getAttributes(); if (!atts1.containsAll(atts2)) return false; for (Iterator it = atts1.iterator(); it.hasNext(); ) { String att = it.next(); Object val = getValue(att); Object val2 = fs.getValue(att); if (val instanceof Variable && val2 instanceof Variable) { if (!((Variable)val).equals(val2, varMap, varMap2)) return false; } else { if (!val.equals(val2)) return false; } } return true; } } ================================================ FILE: src/opennlp/ccg/unify/GFeatVar.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-7 Jason Baldridge, Gunes Erkan and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. 
// // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.unify; import java.io.Serializable; import gnu.trove.TObjectIntHashMap; import opennlp.ccg.grammar.*; /** * A class for variables which can stand for any feature. * * @author Jason Baldridge * @author Gunes Erkan * @author Michael White * @version $Revision: 1.9 $, $Date: 2009/07/17 04:23:30 $ **/ public class GFeatVar implements Variable, Indexed, Mutable, Serializable { private static final long serialVersionUID = -5526887599728099988L; protected final String _name; protected int _index; protected int _hashCode; protected SimpleType type; public GFeatVar(String name) { this(name, 0, null); } public GFeatVar(String name, SimpleType st) { this(name, 0, st); } protected GFeatVar(String name, int index, SimpleType st) { _name = name; _index = index; type = (st != null) ? st : Grammar.theGrammar.types.getSimpleType(Types.TOP_TYPE); _hashCode = _name.hashCode() + _index + type.getIndex(); } public String name() { return _name; } public Object copy() { return new GFeatVar(_name, _index, type); } public void deepMap(ModFcn mf) { mf.modify(this); } public int getIndex() { return _index; } public SimpleType getType() { return type; } public void setIndex(int index) { _hashCode += index - _index; _index = index; } public boolean occurs(Variable var) { return equals(var); } public int hashCode() { return _hashCode; } public boolean equals(Object o) { if (this == o) return true; if (!(o instanceof GFeatVar)) return false; GFeatVar var = (GFeatVar) o; return _index == var._index && _name.equals(var._name) && type.equals(var.type); } /** * Returns a hash code using the given map from vars to ints. */ public int hashCode(TObjectIntHashMap varMap) { // see if this already in map if (varMap.containsKey(this)) return varMap.get(this); // otherwise add it int next = varMap.size() + 1; varMap.put(this, next); return next; } /** * Returns whether this var equals the given object up to variable names, * using the given maps from vars to ints. * (Note that the name and index may differ, but the types must be equal.) 
*/ public boolean equals(Object obj, TObjectIntHashMap varMap, TObjectIntHashMap varMap2) { if (this == obj) return true; if (obj.getClass() != this.getClass()) { return false; } GFeatVar gv = (GFeatVar) obj; if (varMap.get(this) != varMap2.get(gv)) return false; if (!this.type.equals(gv.type)) return false; return true; } public void unifyCheck(Object o) throws UnifyFailure {} public Object unify(Object u, Substitution sub) throws UnifyFailure { if (equals(u)) { return this; } else if (u instanceof SimpleType) { SimpleType st1 = getType(); SimpleType st2 = (SimpleType)u; return sub.makeSubstitution(this, st2.unify(st1, sub)); } else if (u instanceof GFeatVar) { GFeatVar var = (GFeatVar) u; if (var.occurs(this)) throw new UnifyFailure(); SimpleType st1 = getType(); SimpleType st2 = var.getType(); SimpleType st3 = (SimpleType) st2.unify(st1, sub); // substitute var with most specific type if (st3.equals(st2)) return sub.makeSubstitution(this, var); else if (st3.equals(st1)) return sub.makeSubstitution(var, this); else { // need a new var with intersection type GFeatVar var3 = new GFeatVar(_name, UnifyControl.getUniqueVarIndex(), st3); sub.makeSubstitution(var, var3); return sub.makeSubstitution(this, var3); } } else { return sub.makeSubstitution(this, u); } } public Object fill(Substitution sub) throws UnifyFailure { Object val = sub.getValue(this); if (val != null) { return val; } else { return this; } } public String toString() { String retval = _name; if (!type.getName().equals(Types.TOP_TYPE)) retval += ":" + type.getName(); return retval; } } ================================================ FILE: src/opennlp/ccg/unify/GSubstitution.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003 Jason Baldridge, University of Edinburgh (Michael White) // and Gunes Erkan // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.unify; import gnu.trove.*; import java.util.*; /** * Implementation of Substitution interface which ensures that all * the categories it contains are updated as new substitutions are * made. * * @author Jason Baldridge * @author Michael White * @author Gunes Erkan * @version $Revision: 1.13 $, $Date: 2009/12/21 03:27:19 $ */ public class GSubstitution extends THashMap implements Substitution { private static final long serialVersionUID = 1L; private TIntObjectHashMap _indexedObjects = new TIntObjectHashMap(); private TIntIntHashMap _newFeatStrucIndexes = new TIntIntHashMap(); /** * Request the Substitution to identify a variable with an * object. Automagically condenses the Substitution so that all * other values in this Substitution get the new value for the * variable if they contain it. 
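 *
 * A small sketch of the condensing behaviour (the variables and value below are hypothetical):
 * <pre>
 * GSubstitution sub = new GSubstitution();
 * sub.makeSubstitution(x, y);      // x and y now co-vary
 * sub.makeSubstitution(y, val);    // both x and y resolve to val
 * Object xVal = sub.getValue(x);   // val
 * </pre>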
* * @param var the variable whose value has been determined * @param o the Object identified with the variable * @return the Object identified with the variable, which has * potentially undergone further unifications as a result of * making the substitution * @exception throws UnifyFailure if the Object cannot be unified * with a previous value substituted for the Variable. */ @SuppressWarnings("unchecked") public Object makeSubstitution(Variable var, Object u) throws UnifyFailure { Object val1 = getValue(var); if (u instanceof Variable) { Variable var2 = (Variable)u; Object val2 = getValue(var2); // check if var -> u already if (val1 != null && val1.equals(u)) return u; // check if u -> var already if (val2 != null && val2.equals(var)) return var; // otherwise continue if (val1 != null) { if (val1 instanceof Unifiable && ((Unifiable)val1).occurs(var2)) { throw new UnifyFailure(); } if (val2 != null) { u = Unifier.unify(var, val2, this); } else { u = makeSubstitution(var2, val1); } } else if (val2 != null) { if (val2 instanceof Unifiable && ((Unifiable)val2).occurs(var)) { throw new UnifyFailure(); } makeSubstitution(var, val2); } } else if (val1 != null) { u = Unifier.unify(val1, u, this); } put(var, u); for (Iterator i=keySet().iterator(); i.hasNext();) { Variable v = (Variable)i.next(); Object res = getValue(v); if (res instanceof Unifiable) { res = ((Unifiable)res).fill(this); } put(v, res); } if (u instanceof Unifiable) { u = ((Unifiable)u).fill(this); } return u; } /** * Try to get the value of a variable from this Substitution. * Returns null if the variable is unknown to the Substitution. * * @param var the variable whose value after unification is desired * @return the Object which this variable has been unified with */ public Object getValue(Variable var) { Object val = get(var); if (null != val) { if (val instanceof Variable) { Object deepVal = getValue((Variable)val); if (null != deepVal) { val = deepVal; } } } return val; } @SuppressWarnings("unchecked") public Iterator varIterator() { return keySet().iterator(); } public int makeNewIndex(int fs1Index, int fs2Index) { int index = UnifyControl.getUniqueFeatureStructureIndex(); int fs1IndexUpdated = getUpdatedIndex(fs1Index); int fs2IndexUpdated = getUpdatedIndex(fs2Index); addReindex(fs1IndexUpdated, index); addReindex(fs2IndexUpdated, index); return index; } public void addReindex(int oldIndex, int newIndex) { // avoid creating a pointer cycle if (oldIndex == newIndex) return; if (_newFeatStrucIndexes.containsKey(newIndex)) { throw new RuntimeException( "Whoops! 
Index map already contains newIndex: " + newIndex + "\n" + this ); } _newFeatStrucIndexes.put(oldIndex, newIndex); } public int getUpdatedIndex(int oldIndex) { if (!_newFeatStrucIndexes.containsKey(oldIndex)) return oldIndex; return getUpdatedIndex(_newFeatStrucIndexes.get(oldIndex)); } public void addIndexedObject(int index, Object o) { _indexedObjects.put(index, o); } public Object getIndexedObject(int index) { return _indexedObjects.get(getUpdatedIndex(index)); } public void condense() throws UnifyFailure { int[] keys = _indexedObjects.keys(); for (int i=0; i < keys.length; i++) { Object obj = _indexedObjects.get(keys[i]); if (obj instanceof Unifiable) { Object filled = ((Unifiable)obj).fill(this); _indexedObjects.put(keys[i], filled); } } // drop old indexed objects for (int i = 0; i < keys.length; i++) { if (_newFeatStrucIndexes.containsKey(keys[i])) { _indexedObjects.remove(keys[i]); } } } @SuppressWarnings("unchecked") public String toString() { StringBuffer sb = new StringBuffer(); sb.append("vars: \t"); for (Iterator keys=keySet().iterator(); keys.hasNext();) { Object key = keys.next(); sb.append(key).append('=').append(get(key)).append('\t'); } sb.append('\n'); sb.append("indexes: \t"); int indexKeys[] = _newFeatStrucIndexes.keys(); for (int i = 0; i < indexKeys.length; i++) { sb.append(indexKeys[i] + "->" + _newFeatStrucIndexes.get(indexKeys[i]) + "\t"); } return sb.toString(); } } ================================================ FILE: src/opennlp/ccg/unify/GUnifier.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002 Jason Baldridge // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.unify; import opennlp.ccg.synsem.*; /** * A unifier for CCG categories. 
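 *
 * Typical usage is a single static call on two categories (here hypothetical ones obtained
 * from the lexicon or an earlier derivation step):
 * <pre>
 * Category result = GUnifier.unify(cat1, cat2);  // throws UnifyFailure if they do not unify
 * </pre>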
* * @author Jason Baldridge * @version $Revision: 1.1.1.1 $, $Date: 2003/02/28 18:02:13 $ */ public class GUnifier { public static Category unify (Category c1, Category c2) throws UnifyFailure { return (Category)unify(c1, c2, new EmptySubstitution()); } public static Category unify (Category c1, Category c2, Substitution sub) throws UnifyFailure { if (c1 instanceof AtomCat && c2 instanceof ComplexCat) { c2.unifyCheck(c1); return (Category)c2.unify(c1, sub); } c1.unifyCheck(c2); return (Category)Unifier.unify(c1, c2, sub); } } ================================================ FILE: src/opennlp/ccg/unify/Indexed.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002 Jason Baldridge // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.unify; /** * An object which can be indexed. * * @author Jason Baldridge * @version $Revision: 1.1.1.1 $, $Date: 2003/02/28 18:02:13 $ **/ public interface Indexed { /** * Gets the index of this Indexed object. * * @return the index **/ public int getIndex (); /** * Sets the index of this Indexed object. * * @param index An int which provides a unique index **/ public void setIndex (int index); } ================================================ FILE: src/opennlp/ccg/unify/ModFcn.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002 Jason Baldridge // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.unify; /** * Interface for functions which modify Mutable objects. * * @author Jason Baldridge * @version $Revision: 1.1.1.1 $, $Date: 2003/02/28 18:02:13 $ */ public interface ModFcn { /** * Changes a Mutable object in some way. 
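 *
 * A ModFcn is normally handed to deepMap on a Mutable; for example, a hypothetical function
 * that resets the index of every Indexed object in a structure:
 * <pre>
 * ModFcn resetIndexes = new ModFcn() {
 *     public void modify(Mutable m) {
 *         if (m instanceof Indexed) ((Indexed) m).setIndex(0);
 *     }
 * };
 * fs.deepMap(resetIndexes);  // fs is some Mutable, e.g. a feature structure
 * </pre>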
* * @param mf a function to be applied **/ public void modify (Mutable m); } ================================================ FILE: src/opennlp/ccg/unify/Mutable.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002 Jason Baldridge // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.unify; /** * Interface for objects which might contain recursive structure and are * mutable. * * @author Jason Baldridge * @version $Revision: 1.1.1.1 $, $Date: 2003/02/28 18:02:13 $ */ public interface Mutable { /** * Applies a ModFcn to this Mutable and then applies it to all fields * which are themselves Mutables. * * @param mf a function to be applied **/ public void deepMap (ModFcn mf); } ================================================ FILE: src/opennlp/ccg/unify/SelfCondensingSub.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002 Jason Baldridge // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.unify; import java.util.*; /** * Implementation of Substitution interface which ensures that all the * categories it contains are updated as new substitutions are made. * * @author Jason Baldridge * @version $Revision: 1.3 $, $Date: 2009/12/21 03:27:19 $ */ public class SelfCondensingSub extends HashMap implements Substitution { private static final long serialVersionUID = 1L; /** * Request the Substitution to identify a variable with an object. * Automagically condenses the Substitution so that all other values in this * Substitution get the new value for the variable if they contain it. 
* * @param var * the variable whose value has been determined * @param o * the Object identified with the variable * @return the Object identified with the variable, which has potentially * undergone further unifications as a result of making the * substitution * @exception throws * UnifyFailure if the Object cannot be unified with a * previous value substituted for the Variable. */ public Object makeSubstitution(Variable var, Object u) throws UnifyFailure { Object val1 = getValue(var); if (u instanceof Variable) { Variable var2 = (Variable) u; Object val2 = getValue(var2); if (val1 != null) { if (val2 != null) u = Unifier.unify(var, val2, this); else u = makeSubstitution(var2, val1); } else { if (val2 != null) makeSubstitution(var, val2); else put(var, var2); } } else if (val1 != null) { u = Unifier.unify(val1, u, this); } put(var, u); for (Iterator i = keySet().iterator(); i.hasNext();) { Variable v = i.next(); Object res = getValue(v); if (res instanceof Unifiable) { res = ((Unifiable) res).fill(this); } put(v, res); } if (u instanceof Unifiable) { u = ((Unifiable) u).fill(this); } return u; } /** * Try to get the value of a variable from this Substitution. Returns null * if the variable is unknown to the Substitution. * * @param var * the variable whose value after unification is desired * @return the Object which this variable has been unified with */ public Object getValue(Variable var) { return get(var); } public Iterator varIterator() { return keySet().iterator(); } } ================================================ FILE: src/opennlp/ccg/unify/SimpleSubstitution.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-5 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.unify; import java.util.*; /** * Simple implementation of Substitution interface. 
* * @author Jason Baldridge * @version $Revision: 1.3 $, $Date: 2005/10/20 17:30:30 $ */ public class SimpleSubstitution extends HashMap implements Substitution { private static final long serialVersionUID = 1L; public SimpleSubstitution() {} public SimpleSubstitution(Map map) { super(map); } public Object makeSubstitution(Variable var, Object u) throws UnifyFailure { if (u instanceof Unifiable) { u = ((Unifiable) u).fill(this); } put(var, u); return u; } public Object getValue(Variable var) { return get(var); } public Iterator varIterator() { return keySet().iterator(); } } ================================================ FILE: src/opennlp/ccg/unify/SimpleType.java ================================================ /////////////////////////////////////////////////////////////////////////////// //// Copyright (C) 2003-9 Gunes Erkan and Michael White //// //// This library is free software; you can redistribute it and/or //// modify it under the terms of the GNU Lesser General Public //// License as published by the Free Software Foundation; either //// version 2.1 of the License, or (at your option) any later version. //// //// This library is distributed in the hope that it will be useful, //// but WITHOUT ANY WARRANTY; without even the implied warranty of //// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the //// GNU Lesser General Public License for more details. //// //// You should have received a copy of the GNU Lesser General Public //// License along with this program; if not, write to the Free Software //// Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. //////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.unify; import opennlp.ccg.grammar.*; import java.io.ObjectStreamException; import java.io.Serializable; import java.util.*; /** * A simple type for feature values in CCG categories. * * Note that during deserialization, the type is resolved using the current grammar. 
* * @author Gunes Erkan * @author Michael White * @version $Revision: 1.8 $, $Date: 2009/07/17 04:23:30 $ */ public class SimpleType implements Unifiable, Serializable { private static final long serialVersionUID = 7028285176993549672L; private int index; private String name; private BitSet bitset; private BitSet tempBitset = new BitSet(); private transient Types types; public SimpleType(int i, String n, BitSet bs, Types t) { index = i; name = n; bitset = bs; types = t; } public int getIndex() { return index; } public BitSet getBitSet() { return bitset; } public String getName() { return name; } public String toString() { return name; } public void unifyCheck(Object u) throws UnifyFailure { if (!(u instanceof SimpleType)) { throw new UnifyFailure(); } } public Object unify(Object u, Substitution sub) throws UnifyFailure { if (!(u instanceof SimpleType)) { throw new UnifyFailure(); } if (this == u) return this; SimpleType st2 = (SimpleType) u; tempBitset.clear(); tempBitset.or(bitset); tempBitset.and(st2.getBitSet()); int resultTypeIndex = tempBitset.nextSetBit(0); if (resultTypeIndex == -1) { throw new UnifyFailure(); } return types.getIndexMap().get(resultTypeIndex); } public Object fill(Substitution s) throws UnifyFailure { return this; } public boolean occurs(Variable v) { return false; } public int hashCode() { return index; } public boolean equals(Object o) { if (!(o instanceof SimpleType)) return false; if (index == ((SimpleType)o).getIndex()) return true; else return false; } /** Returns canonical version of deserialized type based on current grammar. */ public Object readResolve() throws ObjectStreamException { return Grammar.theGrammar.types.getSimpleType(name); } } ================================================ FILE: src/opennlp/ccg/unify/Substitution.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002 Jason Baldridge and Gann Bierner // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.unify; import java.util.*; /** * Specifies how variable are to be replaced to make two objects unify. * * @author Gann Bierner & Jason Baldridge * @version $Revision: 1.2 $, $Date: 2005/10/20 17:30:30 $ */ public interface Substitution { /** * Request the Substitution to identify a variable with an object. * * @param var * the variable whose value has been determined * @param o * the Object identified with the variable * @return the Object identified with the variable, which has potentially * undergone further unifications as a result of making the * substitution * @exception throws * UnifyFailure if the Object cannot be unified with a * previous value substituted for the Variable. 
*/ public Object makeSubstitution(Variable var, Object u) throws UnifyFailure; /** * Try to get the value of a variable from this Substitution. Should return * null if the variable is unknown to the Substitution. * * @param var * the variable whose value after unification is desired * @return the Object which this variable has been unified with */ public Object getValue(Variable var); public Iterator varIterator(); } ================================================ FILE: src/opennlp/ccg/unify/Unifiable.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-5 Jason Baldridge and Gann Bierner // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.unify; /** * An interface for classes that may be unified. * * @author Gann Bierner * @version $Revision: 1.2 $, $Date: 2005/10/19 21:27:16 $ */ public interface Unifiable { /** * Determines if a Variable occurs within this Unifiable * * @param v * the Variable to check for * @return whether or not the Variable occurs */ public boolean occurs(Variable v); /** * Tests for equality with the given Object. * * @param o * object to test for equality * @return true if this Unifiable is equal to o, false if * not. */ public boolean equals(Object o); /** * Unify this Unfiable with another Object. * * @param o * object to unify with * @param s * Substitution containing the variable resolutions * @exception UnifyFailure * if this Unifiable cannot be unified with the Object * @return an object which represents the unification of this Unifiable with * the Object */ public Object unify(Object u, Substitution s) throws UnifyFailure; /** * Check if this Unifiable can unify with another Object. This should be * implemented as a quick check to allow users of the Unifiable to scan a * group of Unifications to rapidly see if the entire group is at least * possible before descending into each one with a full unification * procedure. Thus, if a call to this method does not result in a * UnifyFailure exception being thrown, it doesn't mean that the Object can * definitely be unified with this Unifiable -- what is important is that * when a call to this method throws a UnifyFailure exception, it permits * one to avoid calling the unify() method on other Unifiables in a group * because the quick check failed on this one. * * @param o * object to check for unifiability * @exception UnifyFailure * if this Unifiable cannot be unified with the Object */ public void unifyCheck(Object u) throws UnifyFailure; /** * Replaces any variables in this Unifiable with the values found for them * in the Substitution argument. 
* * @param s * Substitution containing the variable resolutions * @return a copy of this Unifiable with all variables from the Substitution * replaced by their values. */ public Object fill(Substitution s) throws UnifyFailure; } ================================================ FILE: src/opennlp/ccg/unify/Unifier.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002 Jason Baldridge and Gann Bierner // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.unify; /** * A unification utility that abstracts a few basic issues such * Variables and not needed to pass a substitution object explictly. * * @author Jason Baldridge * @version $Revision: 1.2 $, $Date: 2004/11/11 17:50:13 $ **/ public class Unifier { /** * Uses a SelfCondensingSub underlyingly so that it * is not necessary to pass a substitution object explictly. * * @param u1 the first of two Unifiables to unify * @param u2 the second of two Unifiables to unify * @return the result of unifying u1 and u2 **/ public static final Object unify (Object u1, Object u2) throws UnifyFailure { Substitution sub = new SelfCondensingSub(); Object result = unify(u1, u2, sub); if (result instanceof Unifiable) { result = ((Unifiable)result).fill(sub); } return result; } /** * Method which handles ordering to make sure that the Unifiable * unify() method is called on the Variable if either of the * arguments is a Variable. This way, under a unification scheme * for a set of classes, you don't have to have each Unifiable * check to see if the thing it is trying to be unified with is a * Variable. * * @param u1 the first of two Unifiables to unify * @param u2 the second of two Unifiables to unify * @param sub the substitution object holding global unification * information * @return the result of unifying u1 and u2 **/ public static final Object unify (Object u1, Object u2, Substitution sub) throws UnifyFailure { // !!!!!!!!!!!!!!!!!!!!!!!! CAUTION !!!!!!!!!!!!!!!!!!!!!!!! // the order of this if-else statement is important, so be // careful before you change it! // !!!!!!!!!!!!!!!!!!!!!!!! CAUTION !!!!!!!!!!!!!!!!!!!!!!!! 
if (u2 instanceof Variable) { return ((Variable)u2).unify(u1, sub); } else if (u1 instanceof Unifiable) { return ((Unifiable)u1).unify(u2, sub); } else if (u2 instanceof Unifiable) { return ((Unifiable)u2).unify(u1, sub); } else if (u1.equals(u2)) { return u1; } else { throw new UnifyFailure(); } } } ================================================ FILE: src/opennlp/ccg/unify/UnifyControl.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003 Jason Baldridge and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.unify; import opennlp.ccg.synsem.*; import gnu.trove.*; /** * Center of command for the unification process. * Needs work to allow for multithreading. * * @author Jason Baldridge * @author Michael White * @version $Revision: 1.6 $, $Date: 2005/10/20 17:30:30 $ */ public class UnifyControl { /** * An integer used to keep variables unique in lexical items. */ private static int _varIndex = 0; /** * A function that makes variables unique. */ private static ModFcn uniqueFcn = new ModFcn() { public void modify (Mutable m) { if (m instanceof Indexed && m instanceof Variable) { ((Indexed)m).setIndex(_varIndex); } }}; /** * An integer used to keep feature structure indexes unique. */ private static int _fsIndex = 1; private static TIntIntHashMap _reindexed = new TIntIntHashMap(); private static CategoryFcn indexFcn = new CategoryFcnAdapter() { public void forall (Category c) { FeatureStructure fs = c.getFeatureStructure(); if (fs != null) { int index = fs.getIndex(); if (index > 0) { int $index = _reindexed.get(index); if ($index == 0) { $index = _fsIndex++; _reindexed.put(index, $index); } fs.setIndex($index); } } } }; /** Resets the uniqueness counters. */ public static void startUnifySequence() { _varIndex = 0; _fsIndex = 1; } /** Sets the var and feature structure indices to unique values. */ public static void reindex(Category cat) { reindex(cat, null); } /** Sets the var and feature structure indices to unique values. 
*/ public static void reindex(Category cat, Category anotherCat) { _reindexed.clear(); cat.forall(indexFcn); cat.deepMap(uniqueFcn); if (cat != anotherCat && anotherCat != null) { anotherCat.forall(indexFcn); anotherCat.deepMap(uniqueFcn); } _varIndex++; } public static int getUniqueVarIndex() { return ++_varIndex; } public static int getUniqueFeatureStructureIndex() { return ++_fsIndex; } public static Object copy(Object o) { if (o instanceof Category) { return ((Category)o).copy(); } else if (o instanceof GFeatVar) { return ((GFeatVar)o).copy(); } else if (o instanceof LF) { return ((LF)o).copy(); } else if (o instanceof GFeatStruc) { return ((GFeatStruc)o).copy(); } else { return o; } } } ================================================ FILE: src/opennlp/ccg/unify/UnifyFailure.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-3 Jason Baldridge, Gann Bierner and // University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.unify; /** * @author Jason Baldridge * @author Michael White * @version $Revision: 1.4 $, $Date: 2009/11/28 03:39:27 $ */ public class UnifyFailure extends Exception { private static final long serialVersionUID = 1L; /** Constructor. */ public UnifyFailure() {} /** Constructor with message. */ public UnifyFailure(String m) { super(m); } /** Constructor with two args that failed to unify. */ public UnifyFailure(String arg1, String arg2) { super("Unable to unify " + arg1 + " with " + arg2 + "."); } /** Returns exception message. */ public String toString() { String msg = getMessage(); return "Unify Failure: " + (msg != null ? msg : "(no message)"); } } ================================================ FILE: src/opennlp/ccg/unify/Variable.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2002-7 Jason Baldridge, Gann Bierner and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.unify; import gnu.trove.TObjectIntHashMap; /** * A variable that can stand for some class of Unifiable objects. * * @author Gann Bierner * @author Michael White * @version $Revision: 1.2 $, $Date: 2007/12/20 21:30:22 $ **/ public interface Variable extends Unifiable { /** * Returns the name of this variable. * * @return the variable's name **/ public String name(); /** * Returns a hash code using the given map from vars to ints. */ public int hashCode(TObjectIntHashMap varMap); /** * Returns whether this var equals the given object up to variable names, * using the given maps from vars to ints. */ public boolean equals(Object obj, TObjectIntHashMap varMap, TObjectIntHashMap varMap2); } ================================================ FILE: src/opennlp/ccg/util/ArrayListWithIdentityEquals.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-4 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; import java.util.*; /** * An array list where equality is checked using == on the list elements, which * are assumed to be canonical. * The hashCode method is compatible with SingletonList and StructureSharingList. * * @author Michael White * @version $Revision: 1.4 $, $Date: 2009/12/21 03:27:18 $ */ public class ArrayListWithIdentityEquals extends ArrayList { private static final long serialVersionUID = 1L; /** Default constructor. */ public ArrayListWithIdentityEquals() {} /** Constructor with initial collection. */ public ArrayListWithIdentityEquals(Collection c) { super(c); } /** Constructor with initial capacity. */ public ArrayListWithIdentityEquals(int initialCapacity) { super(initialCapacity); } /** Returns a hash code for this list, using identity hash codes of the list elements. */ public int hashCode() { int hc = 1; for (int i = 0; i < size(); i++) { hc = 31*hc + System.identityHashCode(get(i)); } return hc; } /** Returns whether this list equals the given object, using identity tests on the list elements. 
*/ public boolean equals(Object obj) { if (this == obj) return true; if (!(obj instanceof List)) return false; List list = (List) obj; if (size() != list.size()) return false; for (int i = 0; i < size(); i++) { if (get(i) != list.get(i)) return false; } return true; } } ================================================ FILE: src/opennlp/ccg/util/CompositeFilter.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; import java.util.Arrays; import java.util.Collection; import java.util.Collections; import java.util.HashSet; import java.util.Set; /** * Composes the effects of several {@linkplain Filter filters} into a single filter. * The component filters are interpreted conjunctively, so that they all must allow a * given element for the composite filter to allow it. * * @author Scott Martin */ public class CompositeFilter implements Filter { Set> filters; /** * Creates a new empty composite filter. */ public CompositeFilter() { this.filters = new HashSet>(); } /** * Creates a new composite filter made up of the specified filters. * @see #CompositeFilter(Collection) */ @SafeVarargs public CompositeFilter(Filter... edgeFilters) { this(Arrays.asList(edgeFilters)); } /** * Creates a new composite filter made up of the specified filters. * The specified filters can be filters on an superclass of this filter's * type parameter. */ public CompositeFilter(Collection> filters) { this.filters = new HashSet>(filters); } /** * Gets the set of filters this composite filter is made up of. * @return An unmodifiable set view of the filters making up this composite filter. */ public Set> filters() { return Collections.unmodifiableSet(filters); } /** * Tests whether this filter contains a given filter. * @return true if the specified filter is one of the ones making up this * composite filter. */ public boolean containsFilter(Filter filter) { return filters.contains(filter); } /** * Adds a filter to this composite filter, if it is not already present. * @param filter The filter to add. * @return true if the filter was not already contained. * @throws IllegalArgumentException If filter is null. * * @see Collection#add(Object) */ public boolean addFilter(Filter filter) { if(filter == null) { throw new IllegalArgumentException("filter is null"); } return filters.add(filter); } /** * Removes the specified filter. * @param filter The filter to remove. * @return true if the specified filter was removed from this composite filter. 
*/ public boolean removeFilter(Filter filter) { return filters.remove(filter); } /** * Tests whether the given element is allowed by applying each of this composite filter's components * to it one by one, calling each of their {@link Filter#allows(Object)} method exactly once wit the * specified argument. * * @return false if one of the filters making up this composite filters returns false from its * {@link Filter#allows(Object)} method for the argument e, otherwise true. In particular, * this means that an empty composite filter returns true for every argument. */ @Override public boolean allows(E e) { for(Filter f : filters) { if(!f.allows(e)) { return false; } } return true; } } ================================================ FILE: src/opennlp/ccg/util/DelegatedFilter.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; /** * Abstract class for filters that delegates to another filter that tests elements that do not * necessarily apply to the same type of elements as this filter. This filter's * {@link #allows(Object)} method returns the value of the * {@linkplain #getDelegateFilter() delegate filter}'s allows(...) method * for the value returned by {@link #delegateValueFor(Object)} for the specified * element. *

    * Concrete subclasses need to specify (1) the delegate filter (via their constructor), and * (2) a way to determine which element of type D the delegate filter should use * based on a specified element of type E by implementing {@link #delegateValueFor(Object)}. * A typical example is the case when a filter is desired that compares elements of type E, but * the comparison needs to take place on some type-D object somehow derived from instances of * E, e.g. by an accessor method. * * @param The type of elements that this filter applies to. * @param The type of elements that the delegated filter applies to. * * @author Scott Martin */ public abstract class DelegatedFilter implements Filter { Filter delegateFilter; /** * Creates a delegated filter with the specified filter to delegate to. The delegated filter will be * used in the test for {@link #allows(Object)}, through the {@link #delegateValueFor(Object)}. */ protected DelegatedFilter(Filter delegateFilter) { this.delegateFilter = delegateFilter; } /** * Gets the filter that this filter delegates to. * @return The filter specified at creation. * @see #DelegatedFilter(Filter) */ public Filter getDelegateFilter() { return delegateFilter; } /** * Tests whether this filter allows the specified element by testing whether its * {@linkplain #getDelegateFilter() delegate filter} allows the value of {@link #delegateValueFor(Object)} * for the argument e. * @return true if the delegate filter's {@link Filter#allows(Object)} method returns true * for the element returned by delegateValueFor(e). * @see #delegateValueFor(Object) */ @Override public boolean allows(E e) { return delegateFilter.allows(delegateValueFor(e)); } /** * Gets the element of type D that the delegated filter should use in its * {@link Filter#allows(Object)} comparisons, given the specified type-E element. * @param e The element to obtain a type-D element for. * @return The element that the delegated filter should use for comparison, based on e. */ public abstract D delegateValueFor(E e); } ================================================ FILE: src/opennlp/ccg/util/DisplayPrefs.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2006 Ben Wing // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; import java.util.prefs.Preferences; import opennlp.ccg.TextCCG; /** * Simple class for holding preferences for converting an object to a * string or other displayable representation. 
* * @author Ben Wing * @version $Revision: 1.5 $, $Date: 2007/06/22 01:52:21 $ */ public class DisplayPrefs { /* Whether to show feature info along with each nonterminal */ public boolean showFeats = false; /* Whether to show semantic info (logical forms) */ public boolean showSem = false; /* Which features to show. */ public String featsToShow = ""; /** Constructor sets initial prefs from current user prefs. */ public DisplayPrefs() { Preferences prefs = Preferences.userNodeForPackage(TextCCG.class); showFeats = prefs.getBoolean(TextCCG.SHOW_FEATURES, false); showSem = prefs.getBoolean(TextCCG.SHOW_SEMANTICS, false); featsToShow = prefs.get(TextCCG.FEATURES_TO_SHOW, ""); } } ================================================ FILE: src/opennlp/ccg/util/Filter.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; /** * Interface for filters that characterize a set by some membership criteria. * This interface uses a single method, {@link #allows(Object)}, to allow implementing * classes to say whether the specified element should be a member of the collection or not. *

    * Filters can be thought of as characteristic functions for sets. The type parameter is * used to signal what kind of elements a filter applies to. * * @param The type of elements that this filter applies to. * * @see FilteredSet * @see FilteredMap * @author Scott Martin */ public interface Filter { /** * Tests whether the specified element is allowed. * @return true if the provided element should be allowed into the collection. */ boolean allows(E e); } ================================================ FILE: src/opennlp/ccg/util/FilteredMap.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; import java.util.AbstractMap; import java.util.LinkedHashMap; import java.util.Map; import java.util.Set; /** * A map whose keys must be allowed by a specified {@linkplain #getKeyFilter() key filter}. * The filtered mappings are kept in the same order they occurred in in the * {@linkplain #getOriginalMap() original map}. * * @see Filter * @author Scott Martin */ public class FilteredMap extends AbstractMap { Map originalMap; Filter keyFilter; private final Map map = new LinkedHashMap(); /** * Creates a new filtered map including only the elements in originalMap whose * keys are {@linkplain Filter#allows(Object) allowed} by the specified * keyFilter. *

    * Filtered maps maintain an {@linkplain #entrySet() entry set} whose entries occur in * the same order as they occurred in the original map. * * @param originalMap The map to draw this map's elements from. * @param keyFilter The filter that decides which keys from the original map should be * represented in this filtered map. * @throws IllegalArgumentException If keyFilter is null. * @see Map#putAll(Map) */ public FilteredMap(Map originalMap, Filter keyFilter) { if(keyFilter == null) { throw new IllegalArgumentException("keyFilter is null"); } this.originalMap = originalMap; this.keyFilter = keyFilter; putAll(originalMap); } /** * Gets the map that this map draws its elements from. * @return The map specified at creation * @see #FilteredMap(Map, Filter) */ public Map getOriginalMap() { return originalMap; } /** * Gets this map's key filter. */ public Filter getKeyFilter() { return keyFilter; } /** * Gets the entry set for this map. Each entry's key is * guaranteed to be allowable according to this map's {@linkplain #getKeyFilter() key * filter}. * * @return The subset of the {@linkplain #getOriginalMap() original map}'s entries that * are allowable by the key filter. * * @see Map#entrySet() */ @Override public Set> entrySet() { return map.entrySet(); } /** * Provides the ability to put new mappings into this filtered map, provided the specified * key is {@linkplain Filter#allows(Object) allowed} by this map's * {@linkplain #getKeyFilter() key filter}. * * @return the element previously associated with key if the specified * key is allowed by the key filter (and null if none was associated). * This method always returns null for key/value pairs in which the specified * key is not allowed by the key filter in effect. */ @Override public V put(K key, V value) { if(keyFilter.allows(key)) { return map.put(key, value); } return null; } } ================================================ FILE: src/opennlp/ccg/util/FilteredSet.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; import java.util.AbstractSet; import java.util.Collection; import java.util.Iterator; import java.util.LinkedHashSet; import java.util.Set; /** * A set whose elements must be {@linkplain Filter#allows(Object) allowed} by a specified * {@link Filter}. Conceptually, instances of this class represent the sets described by the * characteristic function corresponding to their {@linkplain #getFilter() filter}. *

    * The elements in the filtered set are kept in the same order they occur in according to the * {@linkplain #getOriginalCollection() original collection}'s iterator. * * @see Filter * @author Scott Martin */ public class FilteredSet extends AbstractSet { Collection originalCollection; Filter filter; private final Set set = new LinkedHashSet(); /** * Creates a new filtered set based on the specified collection and filter. The resulting set will * contain all the members of the original collection for which the specified filter's * {@link Filter#allows(Object)} method returns true. * @param originalCollection The collection from which this filtered set will draw its elements. * @param filter The filter that decides which of the members of originalCollection are * allowable. The specified filter can apply to elements of any superclass of this filtered set's * type parameter. * @throws IllegalArgumentException If filter is null. * * @see #addAll(Collection) */ public FilteredSet(Collection originalCollection, Filter filter) { if(filter == null) { throw new IllegalArgumentException("filter is null"); } this.filter = filter; this.originalCollection = originalCollection; addAll(originalCollection); } /** * Gets the original collection from which this filtered set's elements are drawn. * @return The collection specified at creation. * @see #FilteredSet(Collection, Filter) */ public Collection getOriginalCollection() { return originalCollection; } /** * Gets the filter used by this filtered set to determine which elements are allowed in it. * @return The filter specified at creation. * @see #FilteredSet(Collection, Filter) */ public Filter getFilter() { return filter; } /** * Gets an iterator over the elements in this filtered set. */ @Override public Iterator iterator() { return set.iterator(); } /** * Gets the size of this filtered set (the number of elements it contains). */ @Override public int size() { return set.size(); } /** * Adds an element if it conforms to the {@linkplain #getFilter() filter in effect}, determined by * consulting the filter's {@link Filter#allows(Object)} method using the supplied element. * @param e The element to add, after testing its allowability according to this filtered set's filter. * @return true if the filter allows e and this set changed as a result of the addition * (because the specified element e was not already contained). */ @Override public boolean add(E e) { return filter.allows(e) && set.add(e); } } ================================================ FILE: src/opennlp/ccg/util/GroupMap.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-6 Jason Baldridge, Gann Bierner and // Michael White (University of Edinburgh, The Ohio State University) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. 
// // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; import gnu.trove.*; import java.io.Serializable; import java.util.*; /** * A map where putting a value does not replace an old value but is rather * included in a set of values for that key. * The map may use identity equals on keys. * * @author Jason Baldridge * @author Gann Bierner * @author Michael White * @version $Revision: 1.9 $, $Date: 2009/07/17 04:23:30 $ */ public class GroupMap implements Serializable { private static final long serialVersionUID = -2995356057195571222L; // the underlying map private THashMap map; /** Default constructor. */ public GroupMap() { this(false); } /** Constructor with flag for whether to use identity instead of equals on keys. */ public GroupMap(boolean useIdentityEquals) { if (useIdentityEquals) map = new THashMap(new TObjectIdentityHashingStrategy()); else map = new THashMap(); } /** Adds the given key-value pair to the map, and returns null. */ @SuppressWarnings("unchecked") public Object put(KeyType key, ValType value) { // get current val Object currentVal = map.get(key); // if none, add value to map if (currentVal == null) { map.put(key, value); } // if already a set, add value to set else if (currentVal instanceof Set) { Set set = (Set) currentVal; set.add(value); } // otherwise replace with a set including both values else { Set set = new THashSet(); set.add((ValType)currentVal); set.add(value); map.put(key, set); } // return null, since we're not really replacing the old val return null; } /** Returns the set of values for the given key (or null). */ @SuppressWarnings("unchecked") public Set get(KeyType key) { // get val Object val = map.get(key); // return if null or already a set if (val == null || val instanceof Set) { return (Set) val; } // otherwise replace val with a set and return it Set set = new THashSet(); set.add((ValType)val); map.put(key, set); return set; } /** Adds a key-value pair to the map for all the given vals. */ public void putAll(KeyType key, Collection vals) { for (ValType val : vals) put(key, val); } /** Returns the size of the underlying map. */ public int size() { return map.size(); } /** Returns the keys. */ @SuppressWarnings("unchecked") public Set keySet() { return (Set) map.keySet(); } /** Returns whether the keys contain the given one. */ public boolean containsKey(KeyType key) { return map.containsKey(key); } /** Removes the given key, returning its previous value (if any). */ Set remove(KeyType key) { Set retval = get(key); map.remove(key); return retval; } } ================================================ FILE: src/opennlp/ccg/util/IntHashSetMap.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003 Jason Baldridge, Gann Bierner and // University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. 
// // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; import gnu.trove.*; /** * A map from ints to sets which allows objects with the same key to be * added without overriding previous puts. * * @author Jason Baldridge * @author Gann Bierner * @author Michael White * @version $Revision: 1.6 $, $Date: 2005/10/13 20:33:49 $ */ public class IntHashSetMap extends TIntObjectHashMap { private static final long serialVersionUID = 1L; /** Adds the given key-value pair to the map. */ public Object put(int key, Object value) { THashSet val = (THashSet) get(key); if (val==null) { val = new THashSet(); val.add(value); super.put(key, val); } else { val.add(value); } return val; } } ================================================ FILE: src/opennlp/ccg/util/Interner.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; import java.util.*; import java.lang.ref.*; /** * A utility class for interning (canonicalizing) objects. * A WeakHashMap is used as the backing store, so that interned objects can * be garbage collected. * Normally, it is easier to use the globalIntern method (sharing a global * backing store) than to allocate separate interners. * Individual interners can be constructed to use soft references to * the interned objects, so that they are kept around longer than is the * case with weak references (the default). * * @author Michael White * @version $Revision: 1.5 $, $Date: 2005/10/13 20:33:49 $ * */ public class Interner { // the backing store private Map> weakMap = new WeakHashMap>(); // flag for whether to use soft references private boolean softRefs = false; /** Default constructor. */ public Interner() {} /** Constructor with soft references flag. */ public Interner(boolean softRefs) { this.softRefs = softRefs; } /** * Returns a canonical version of the given object. * The returned object is .equals() to the given one. * If the given object is not equal to one already seen, * then the returned object will be == to the given one. 
*/ public T intern(T obj) { // check if equivalent key already in map if (weakMap.containsKey(obj)) { // return existing canonical obj if so Reference ref = weakMap.get(obj); return ref.get(); } // otherwise add this object to the map, wrapped in a // weak/soft reference so that it can still be gc'ed Reference ref = (softRefs) ? new SoftReference(obj) : new WeakReference(obj); weakMap.put(obj, ref); return obj; } /** * Returns the canonical version of the given object, if any, * otherwise returns null. */ public T getInterned(T obj) { // get weak reference to canonical obj, if any Reference ref = weakMap.get(obj); // return obj, if any, otherwise null return (ref != null) ? ref.get() : null; } /** Returns the number of interned objects. */ public int size() { return weakMap.size(); } // the global interner private static Interner globalInterner = null; /** * Returns a canonical version of the given object using a global interner. * The returned object is .equals() to the given one. * If the given object is not equal to one already seen, * then the returned object will be == to the given one. */ public static Object globalIntern(Object obj) { if (globalInterner == null) globalInterner = new Interner(); return globalInterner.intern(obj); } /** * Returns the canonical version of the given object using the global interner, if any, * otherwise returns null. */ public static Object getGlobalInterned(Object obj) { if (globalInterner == null) return null; return globalInterner.getInterned(obj); } /** Returns the number of interned objects in the global interner. */ public static int globalSize() { if (globalInterner == null) return 0; return globalInterner.size(); } /** Tests the implementation. */ public static void main(String[] args) { Interner interner = new Interner(); int SIZE = 100000; Integer[] ints = new Integer[SIZE]; System.out.println("Adding " + SIZE + " ints to interner."); for (int i = 0; i < SIZE; i++) { ints[i] = new Integer(i); Integer interned = interner.intern(ints[i]); if (interned != ints[i]) { System.out.println("Whoops: ints[" + i + "] not == to interned: " + interned); System.exit(-1); } } System.out.println("interner.size(): " + interner.size()); // should be SIZE System.out.println("Doing gc()."); System.gc(); System.out.println("interner.size(): " + interner.size()); // should be the same System.out.println(); System.out.println("Now adding " + SIZE + " equivalent ints to interner."); for (int i = 0; i < SIZE; i++) { Integer intI = new Integer(i); Integer interned = interner.intern(intI); if (interned == intI) { System.out.println("Whoops: intI (i=" + i + ") is == to interned: " + interned); System.exit(-1); } } System.out.println("interner.size(): " + interner.size()); // should be the same System.out.println(); System.out.println("Next adding " + SIZE + " new, unreferenced ints to interner."); for (int i = SIZE; i < SIZE*2; i++) { Integer intI = new Integer(i); Integer interned = interner.intern(intI); if (interned != intI) { System.out.println("Whoops: intI (i=" + i + ") not == to interned: " + interned); System.exit(-1); } } System.out.println("interner.size(): " + interner.size()); // should be larger than SIZE System.out.println("Doing gc()."); System.gc(); System.out.println("interner.size(): " + interner.size()); // should be back to SIZE System.out.println(); } } ================================================ FILE: src/opennlp/ccg/util/InverseFilter.java ================================================ 
////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; /** * A filter that wraps another filter an inverts its effects. Specifically, for each argument that * the wrapped filter's {@link Filter#allows(Object)} method returns true, this filter * returns false, and vice versa. * * @author Scott Martin */ public class InverseFilter implements Filter { Filter originalFilter; /** * Creates a new filter based on the specified filter, inverting its effects. The specified filter can * apply to any superclass of this filter's type parameter. * @param originalFilter The filter to invert. * @throws IllegalArgumentException If originalFilter is null. */ public InverseFilter(Filter originalFilter) { if(originalFilter == null) { throw new IllegalArgumentException("originalFilter is null"); } this.originalFilter = originalFilter; } /** * Gets the original, non-inverted filter that this inverse filter wraps. * @return The filter specified at creation. * @see #InverseFilter(Filter) */ public Filter getOriginalFilter() { return originalFilter; } /** * Tests whether this filter allows a specified element by calling the original filter's * {@link Filter#allows(Object)} method and reversing its boolean value. * * @param e The element to test. * @return A value equivalent to calling !getOriginalFilter().allows(e). */ @Override public boolean allows(E e) { return !originalFilter.allows(e); } } ================================================ FILE: src/opennlp/ccg/util/JLineReader.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004 David Reitter and University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; import java.io.*; import java.util.*; import jline.*; /** * A command-line reader based on JLine. 
* * @author David Reitter * @author Michael White * @version $Revision: 1.4 $, $Date: 2009/12/21 03:27:18 $ */ public class JLineReader extends LineReader { // reader for console input ConsoleReader reader; // command history, buffer History history = null; StringWriter histbuf = null; /** Constructor with completion strings. */ public JLineReader(String[] completions) throws IOException { // init reader reader = new ConsoleReader(); // store commands for 'tab' argument completion List completors = new LinkedList(); completors.add(new SimpleCompletor(completions)); reader.addCompletor(new ArgumentCompletor(completors)); } /** Sets the command history. */ public void setCommandHistory(String histStr) throws IOException { // initialize history with max size = 50 history = new History(); history.setMaxSize(50); if (!histStr.equals("")) { histStr = histStr.replaceAll("&#10;", "\n"); // using &#10; to get around XML problem in Java 1.4
StringReader sreader = new StringReader(histStr); history.load(sreader); } // set to reader's history reader.setHistory(history); } /** Gets the current command history. */ public String getCommandHistory() throws IOException { if (history == null) return ""; StringBuffer retbuf = new StringBuffer(); List commands = history.getHistoryList(); for (Iterator it = commands.iterator(); it.hasNext(); ) { retbuf.append(it.next().toString()); if (it.hasNext()) retbuf.append("&#10;"); // using &#10;
    to get around XML problem in Java 1.4 } return retbuf.toString(); } /** Returns an input string, using the given prompt. */ public String readLine(String prompt) throws IOException { return reader.readLine(prompt); } } ================================================ FILE: src/opennlp/ccg/util/LineReader.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004 University of Edinburgh (Michael White) and David Reitter // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; import java.io.*; /** * Abstract command-line reader. * * @author Michael White * @author David Reitter * @version $Revision: 1.2 $, $Date: 2005/10/13 20:33:49 $ */ abstract public class LineReader { /** Creates a default line reader (currently a JLineReader) with the given completion strings. */ public static LineReader createLineReader(String[] completions) throws IOException { return new JLineReader(completions); } /** Sets the command history. */ abstract public void setCommandHistory(String histStr) throws IOException; /** Gets the current command history. */ abstract public String getCommandHistory() throws IOException; /** Returns an input string, using the given prompt. */ abstract public String readLine(String prompt) throws IOException; } ================================================ FILE: src/opennlp/ccg/util/ListMap.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2006 Michael White (The Ohio State University) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; import gnu.trove.*; import java.util.*; /** * A map where putting a value does not replace an old value * but is instead included in a list of values for that key. * The map may use identity equals on keys. * (NB: A ListMap is essentially a GroupMap that uses lists instead of sets.) 
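* An illustrative usage sketch (an editorial addition, not part of the original file; it assumes
* the class is parameterized as ListMap<KeyType, ValType>, as the KeyType/ValType names in the
* method signatures below suggest, and the variable names and data are hypothetical):
* <pre>{@code
*   ListMap<String, String> argsByVerb = new ListMap<String, String>();
*   argsByVerb.put("eat", "apple");                 // first value for "eat"
*   argsByVerb.put("eat", "cake");                  // added alongside "apple", not replacing it
*   List<String> eatArgs = argsByVerb.get("eat");   // ["apple", "cake"]
*   List<String> none = argsByVerb.get("drink");    // null: no values for this key
* }</pre>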
* * @author Michael White * @version $Revision: 1.1 $, $Date: 2006/08/15 18:21:31 $ */ public class ListMap { // the underlying map private THashMap map; /** Default constructor. */ public ListMap() { this(false); } /** Constructor with flag for whether to use identity instead of equals on keys. */ public ListMap(boolean useIdentityEquals) { if (useIdentityEquals) map = new THashMap(new TObjectIdentityHashingStrategy()); else map = new THashMap(); } /** Adds the given key-value pair to the map, and returns null. */ @SuppressWarnings("unchecked") public Object put(KeyType key, ValType value) { // get current val Object currentVal = map.get(key); // if none, add value to map if (currentVal == null) { map.put(key, value); } // if already a list, add value to list else if (currentVal instanceof List) { List list = (List) currentVal; list.add(value); } // otherwise replace with a list including both values else { List list = new ArrayList(3); list.add((ValType)currentVal); list.add(value); map.put(key, list); } // return null, since we're not really replacing the old val return null; } /** Returns the list of values for the given key (or null). */ @SuppressWarnings("unchecked") public List get(KeyType key) { // get val Object val = map.get(key); // return if null or already a list if (val == null || val instanceof List) { return (List) val; } // otherwise replace val with a list and return it List list = new ArrayList(1); list.add((ValType)val); map.put(key, list); return list; } /** Adds a key-value pair to the map for all the given vals. */ public void putAll(KeyType key, Collection vals) { for (ValType val : vals) put(key, val); } /** Returns the size of the underlying map. */ public int size() { return map.size(); } /** Returns the keys. */ @SuppressWarnings("unchecked") public Set keySet() { return (Set) map.keySet(); } /** Returns whether the keys contain the given one. */ public boolean containsKey(KeyType key) { return map.containsKey(key); } /** Removes the given key, returning its previous value (if any). */ List remove(KeyType key) { List retval = get(key); map.remove(key); return retval; } } ================================================ FILE: src/opennlp/ccg/util/MembershipFilter.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; import java.util.Set; /** * A filter that allows elements based on their membership in a set specified at creation. Later modifications * to this set will be reflected in the behavior of this filter's {@link #allows(Object)} method because * the set is not copied at creation. 
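* A minimal usage sketch (an editorial addition, not from the original source; it assumes the
* generic declarations Filter<E> and MembershipFilter<E> suggested by the stripped type
* parameters in this dump, plus the usual java.util imports; the example data is hypothetical):
* <pre>{@code
*   Set<String> closedClass = new HashSet<String>(Arrays.asList("the", "a", "of"));
*   Filter<String> inClosedClass = new MembershipFilter<String>(closedClass);
*   inClosedClass.allows("the");   // true
*   inClosedClass.allows("dog");   // false
*   closedClass.add("an");
*   inClosedClass.allows("an");    // true, since the backing set is not copied
* }</pre>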
* * @author Scott Martin */ public class MembershipFilter implements Filter { /** * The set to test for membership. */ protected Set members; /** * Creates a new membership filter based on the specified set of members. This set can later be modified * and have its new membership reflected by this filter's {@link #allows(Object)} method because the * specified set is not copied by this filter. * * @param members The set to test for membership. * @throws IllegalArgumentException If members is null. */ public MembershipFilter(Set members) { if(members == null) { throw new IllegalArgumentException("members is null"); } this.members = members; } /** * Tests whether this membership filter allows the specified element by testing whether the membership * set contains the element. * * @param e The element to test membership for. * @return true if the set of members specified at creation contains e. * @see #MembershipFilter(Set) */ @Override public boolean allows(E e) { return members.contains(e); } } ================================================ FILE: src/opennlp/ccg/util/Pair.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003 Jason Baldridge, Gann Bierner and // University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; import java.io.Serializable; /** * Dinky class to package pairs of things. * * @author Jason Baldridge * @author Gann Bierner * @author Michael White * @version $Revision: 1.7 $, $Date: 2009/12/21 03:27:18 $ */ public final class Pair implements Serializable { private static final long serialVersionUID = 3626104184233533389L; /** The first element of the pair. */ public final TypeA a; /** The second element of the pair. */ public final TypeB b; /** Constructor. */ public Pair(TypeA a, TypeB b) { this.a = a; this.b = b; } /** Returns a hash code constructed from those of a and b. */ public int hashCode() { return a.hashCode() - b.hashCode(); } /** Returns true if the given object pairs the same elements. */ public boolean equals(Object obj) { if (this == obj) return true; if (!(obj instanceof Pair)) return false; Pair p = (Pair) obj; return a.equals(p.a) && b.equals(p.b); } /** Returns "[a/b]". 
*/ public String toString() { return "["+a+"/"+b+"]"; } } ================================================ FILE: src/opennlp/ccg/util/SingletonList.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; import java.io.Serializable; import java.util.*; /** * An unmodifiable list of one element. * Equality is checked using == on the list element, which * is assumed to be canonical. * * @author Michael White * @version $Revision: 1.5 $, $Date: 2009/12/21 03:27:18 $ */ public class SingletonList extends AbstractList implements Serializable { private static final long serialVersionUID = -4340168177098319085L; /** The single list element. */ public final T elt; /** Constructor. */ public SingletonList(T elt) { this.elt = elt; } /** Returns the size of this list. */ public int size() { return 1; } /** Returns the ith element of the list. */ public T get(int i) { if (i == 0) return elt; else throw new IndexOutOfBoundsException("No element with index: " + i); } /** Returns a hash code for this list, using the identity hash code of the list element. */ public int hashCode() { return 31 + System.identityHashCode(elt); } /** Returns whether this list equals the given object, using identity tests on the list element. */ public boolean equals(Object obj) { if (this == obj) return true; if (!(obj instanceof List)) return false; List list = (List) obj; if (size() != list.size()) return false; return (get(0) == list.get(0)); } } ================================================ FILE: src/opennlp/ccg/util/StructureSharingList.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2003-4 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; import java.io.Serializable; import java.util.*; /** * An unmodifiable list formed by sequencing two sublists. * The sublists are assumed to remain unchanged as well. * Equality is checked using == on the list elements, which * are assumed to be canonical. * * @author Michael White * @version $Revision: 1.7 $, $Date: 2009/12/21 03:27:18 $ */ public class StructureSharingList extends AbstractList implements Serializable { private static final long serialVersionUID = 6692080357319326492L; /** The first sublist. */ public final List first; /** The second sublist. */ public final List second; // cached hashcode private int hashcode = -1; // size private final int size; /** Constructor. */ public StructureSharingList(List first, List second) { this.first = first; this.second = second; this.size = first.size() + second.size(); } /** Returns the size of this list. */ public int size() { return size; } /** Returns the ith element of the list. */ public T get(int i) { if (i < first.size()) { return first.get(i); } else { return second.get(i - first.size()); } } /** Returns a hash code for this list, using identity hash codes of the list elements. */ public int hashCode() { // check whether already cached if (hashcode != -1) return hashcode; int hc = 1; for (int i = 0; i < size(); i++) { hc = 31*hc + System.identityHashCode(get(i)); } // cache then return hashcode = hc; return hc; } /** Returns whether this list equals the given object, using identity tests on the list elements. */ public boolean equals(Object obj) { if (this == obj) return true; if (!(obj instanceof List)) return false; List list = (List) obj; if (list instanceof StructureSharingList) { StructureSharingList ssl = (StructureSharingList) list; if (first == ssl.first && second == ssl.second) return true; } if (size() != list.size()) return false; for (int i = 0; i < size(); i++) { if (get(i) != list.get(i)) return false; } return true; } } ================================================ FILE: src/opennlp/ccg/util/TrieMap.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005 University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; import java.util.*; /** * Implements a trie with a data object at each node. Keys are assumed to be * canonical, and thus checked using identity (==) rather than equality. For * efficient allocation, all children can be added at once. * * @author Michael White * @version $Revision: 1.6 $, $Date: 2011/03/20 20:11:58 $ */ public class TrieMap { /** Interface for methods returning an interned key. 
*/ public interface KeyExtractor { /** Returns an interned key. */ public KeyType getKey(); } /** The data object. */ public DataType data; /** * The mapping to the children. If there is just one child, it's stored in a * pair with its key. Otherwise, an IdentityHashMap is used. */ private Object childMap = null; /** The parent node. */ private TrieMap parent = null; /** Constructor with data object. */ public TrieMap(DataType data) { this.data = data; } /** Factory method, for adding empty child nodes. */ protected TrieMap createNode() { return new TrieMap(null); } /** Adds the given child with its key. */ @SuppressWarnings("unchecked") public void addChild(KeyType key, TrieMap child) { child.parent = this; if (childMap == null) { childMap = new Pair>(key, child); return; } Map> map; if (childMap instanceof Pair) { Pair> pair = (Pair>) childMap; map = new IdentityHashMap>(); map.put(pair.a, pair.b); childMap = map; } else { map = (Map>) childMap; } map.put(key, child); } /** Adds the given children with their keys. */ @SuppressWarnings("unchecked") public void addChildren(List keys, List> childNodes) { if (childMap == null && keys.size() == 1) { TrieMap child = childNodes.get(0); child.parent = this; childMap = new Pair>(keys.get(0), child); return; } Map> map; if (childMap == null) { map = new IdentityHashMap>(keys.size()); childMap = map; } else if (childMap instanceof Pair) { Pair> pair = (Pair>) childMap; map = new IdentityHashMap>(keys.size() + 1); map.put(pair.a, pair.b); childMap = map; } else { map = (Map>) childMap; } for (int i = 0; i < keys.size(); i++) { TrieMap child = childNodes.get(i); child.parent = this; map.put(keys.get(i), child); } } /** Gets the parent node, or null if none. */ public TrieMap getParent() { return parent; } /** Gets the child for the given key, or null if none. */ @SuppressWarnings("unchecked") public TrieMap getChild(KeyType key) { if (childMap == null) return null; if (childMap instanceof Pair) { Pair> pair = (Pair>) childMap; if (pair.a == key) return pair.b; else return null; } Map> map = (Map>) childMap; return map.get(key); } /** Gets the child for the given list of keys, or null if none. */ public TrieMap getChildFromList(List keys) { TrieMap next = this; for (int pos = 0; pos < keys.size(); pos++) { next = next.getChild(keys.get(pos)); if (next == null) return null; } return next; } /** Gets the child for the given list of keys extractors, or null if none. */ public TrieMap getChildFromLazyList(List> keyExtractors) { TrieMap next = this; for (int pos = 0; pos < keyExtractors.size(); pos++) { next = next.getChild(keyExtractors.get(pos).getKey()); if (next == null) return null; } return next; } /** * Finds the child for the given key, adding one (with a null data object) * if necessary. */ public TrieMap findChild(KeyType key) { TrieMap child = getChild(key); if (child == null) { child = createNode(); addChild(key, child); } return child; } /** * Finds the child for the given list of keys, adding one (with a null data * object) if necessary, along with any necessary intervening parents. */ public TrieMap findChildFromList(List keys) { TrieMap next = this; for (int pos=0; pos < keys.size(); pos++) { KeyType key = keys.get(pos); TrieMap child = next.getChild(key); if (child == null) { child = createNode(); next.addChild(key, child); } next = child; } return next; } /** * Finds the child for the given list of keys, adding one (with a null data * object) if necessary, along with any necessary intervening parents. 
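* For orientation, an illustrative sketch of the corresponding eager-list methods
* (an editorial addition, not part of the original file; it assumes the declaration
* TrieMap<KeyType, DataType> and canonical keys, here interned string literals,
* with hypothetical example data):
* <pre>{@code
*   TrieMap<String, Integer> root = new TrieMap<String, Integer>(null);
*   List<String> path = Arrays.asList("the", "big", "dog");
*   root.findChildFromList(path).data = 3;               // creates intervening nodes as needed
*   Integer n = root.getChildFromList(path).data;        // 3
*   TrieMap<String, Integer> missing =
*       root.getChildFromList(Arrays.asList("the", "cat"));  // null: no such path
* }</pre>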
*/ public TrieMap findChildFromLazyList(List> keyExtractors) { TrieMap next = this; for (int pos=0; pos < keyExtractors.size(); pos++) { KeyType key = keyExtractors.get(pos).getKey(); TrieMap child = next.getChild(key); if (child == null) { child = createNode(); next.addChild(key, child); } next = child; } return next; } /** * Gets the keys leading to this node. This requires a linear search at each * level. */ @SuppressWarnings("unchecked") public List traceKeys() { ArrayList retval = new ArrayList(); // collect keys up to root TrieMap currentNode = this; TrieMap currentParent = parent; while (currentParent != null) { if (currentParent.childMap instanceof Pair) { Pair> pair = (Pair>) currentParent.childMap; retval.add(pair.a); } else { Map> map = (Map>) currentParent.childMap; for (Map.Entry> entry : map.entrySet()) { if (entry.getValue() == currentNode) { retval.add(entry.getKey()); break; } } } currentNode = currentParent; currentParent = currentParent.parent; } // reverse and return Collections.reverse(retval); return retval; } /** Returns this trie map as a string, with indenting. */ public String toString() { StringBuffer sb = new StringBuffer(); toString(sb, ""); return sb.toString(); } // appends this trie map as a string, with the given indenting level, // to the given string buffer @SuppressWarnings("unchecked") private void toString(StringBuffer sb, String indent) { sb.append("node: " + data); if (childMap == null) return; indent += " "; if (childMap instanceof Pair) { Pair> pair = (Pair>) childMap; toString(sb, indent, pair.a, pair.b); } else { Map> map = (Map>) childMap; List keys = new ArrayList(map.keySet()); Comparator toStringComparator = new Comparator() { public int compare(KeyType o1, KeyType o2) { return o1.toString().compareTo(o2.toString()); } }; Collections.sort(keys, toStringComparator); for (KeyType key : keys) { toString(sb, indent, key, map.get(key)); } } } // appends the given key and child private void toString(StringBuffer sb, String indent, Object key, TrieMap child) { sb.append("\n").append(indent).append('[').append(key).append("] "); child.toString(sb, indent); } } ================================================ FILE: src/opennlp/ccg/util/VisitedFilter.java ================================================ ////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2012 Scott Martin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; import java.util.HashSet; /** * A filter that tracks which elements have already been visited by some process or iteration, allowing only * those that have not yet been visited. An element is considered visited when this filter's * {@link #allows(Object)} method has been called with it as an argument. *
<p>
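* A minimal usage sketch (an editorial addition, not from the original source; it assumes the
* declaration VisitedFilter<E> suggested by the stripped type parameters, with hypothetical data):
* <pre>{@code
*   VisitedFilter<String> unseen = new VisitedFilter<String>();
*   unseen.allows("np");      // true: first visit, "np" is now marked as visited
*   unseen.allows("np");      // false: already visited
*   unseen.hasVisited("s");   // false: checking alone does not mark an element
* }</pre>
* <p>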
    * Internally, the visited elements are tracked by using a * {@link MembershipFilter} based on a {@link HashSet}. * * @author Scott Martin */ public class VisitedFilter extends MembershipFilter { /** * Creates a new visited filter with an empty set of visited elements. */ public VisitedFilter() { super(new HashSet()); } /** * Tests whether this filter allows e by testing whether or not it has been visited. An element * has been visited if this method has been previously called with it as an argument. * * @param e The element to test whether it has been visited or not. * @return true if e has not yet been visited. * * @see #hasVisited(Object) */ @Override public boolean allows(E e) { if(!hasVisited(e)) { members.add(e); return true; } return false; } /** * Tests whether the specified element has been visited or not. * @param e The element to test for visitation. * @return true if e is among the elements that have been previously visited. * * @see #allows(Object) * @see MembershipFilter#allows(Object) */ public boolean hasVisited(E e) { return super.allows(e); } } ================================================ FILE: src/opennlp/ccg/util/Visualizer.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2004 Alexandros Triantafyllidis and // University of Edinburgh (Michael White) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; import opennlp.ccg.lexicon.*; import opennlp.ccg.grammar.*; import opennlp.ccg.synsem.*; import java.io.*; import java.util.*; /** * Class for visualizing CCG derivations using latex. 
* * @author Alexandros Triantafyllidis * @author Michael White * @version $Revision: 1.9 $, $Date: 2009/12/21 03:27:18 $ */ public class Visualizer { private String ruleToTeX(String rule, int indent, int length) { StringBuffer sb = new StringBuffer(); int i=0; for (i=0; i < indent; i++) sb.append("&"); sb.append(" \\mc{" + Integer.toString(length) + "} "); if(rule == null || rule.length()==1) sb.append("{\\hrulefill_{"+ rule + "}} \\\\\n"); else sb.append("{\\hrulefill_{"+ rule.substring(0,1) + "\\mathbf{" + rule.substring(1) + "}}}\\\\\n"); return sb.toString(); } // Gets a file name for a temporary file, e.g.: ~tmp0 public String getTempFileName() { File f1 = null; File f2 = null; int i=0; f1 = new File("~tmp"+Integer.toString(i)+".tex"); f2 = new File("~tmp"+Integer.toString(i)+".div"); while(f1.exists() || f2.exists() ) { i++; f1 = null; f2 = null; f1 = new File("~tmp"+Integer.toString(i)+".tex"); f2 = new File("~tmp"+Integer.toString(i)+".div"); } f1 = null; f2 = null; return "~tmp"+Integer.toString(i); } public String getTempDirName() { File f1 = null; int i=0; f1 = new File("tmp"); while(f1.exists() ) { i++; f1 = null; f1 = new File("tmp"+Integer.toString(i) ); } f1 = null; return "tmp"+Integer.toString(i); } public int getTreeDepth(Sign sign, int level) { int max_depth = 0, depth = 0; Sign[] children = sign.getDerivationHistory().getInputs(); if (children != null && sign.getWords().size() > 1) for (int i=0; i < children.length; i++) { depth = getTreeDepth(children[i], level+1); if (depth > max_depth) max_depth = depth; } else max_depth = level; return max_depth; } private int numberOfLeaves(Sign results) { int totalLeaves = 0; Sign[] children = results.getDerivationHistory().getInputs(); if (children==null || results.getWords().size()==1) return 1; for(int i=0;i processSign(Sign results, int level, int identation) { List signList = new ArrayList(); Sign[] children = results.getDerivationHistory().getInputs(); int depth = getTreeDepth(results, 0); TeXSign ts = new TeXSign(); int offset=0; if (children != null && results.getWords().size() > 1) for (int i=0; i < children.length; i++) { if (i > 0) offset += numberOfLeaves(children[i-1]); signList.addAll( processSign(children[i], level + 1, identation + offset) ); } ts.identation = identation; ts.height = depth; ts.sign = results; signList.add(ts); return signList; } public boolean writeFooter(String fileName){ java.io.BufferedWriter bw = null; try{ bw = new java.io.BufferedWriter(new FileWriter(fileName,true) ); bw.write("\\end{document}\n"); bw.close(); } catch(Exception e){ return false; } return true; } public boolean writeHeader(String fileName) { java.io.BufferedWriter bw = null; try { bw = new java.io.BufferedWriter(new FileWriter(fileName) ); bw.write("\\documentclass{article}\n"); bw.write("\\usepackage[margin=0.5in]{geometry}\n"); bw.write("\\newcommand{\\deriv}[2]\n"); bw.write("{ \\renewcommand{\\arraystretch}{.5}\n"); bw.write("$\\begin{array}[t]{*{#1}{c}}\n"); bw.write(" #2\n"); bw.write(" \\end{array}$ }\n"); bw.write("\\newcommand{\\gf}[1]{\\textsf{\\textsl{#1}}}\n"); bw.write("\\newcommand{\\cf}[1]{\\mbox{\\ensuremath{\\cfont{#1}}}}\n"); bw.write("\\newcommand{\\uline}[1]\n"); bw.write("{\\mc{#1}{\\hrulefill} }\n"); bw.write("\\newcommand{\\mc}[2]\n"); bw.write(" {\\multicolumn{#1}{c}{#2}}\n"); bw.write("\\newcommand{\\cfont}{\\mathsf}\n"); bw.write("\\newcommand{\\bs}{\\backslash}\n"); bw.write("\\newcommand{\\subsa}[1]{\\hspace{-0.75mm}_{_{#1}}}\n"); bw.write("\\newcommand{\\subsb}[1]{\\hspace{-0.10mm}_{_{#1}}}\n"); 
bw.write("\\newcommand{\\subs}[1]{\\hspace{-0.40mm}_{#1}}\n"); bw.write("\\newcommand{\\subsf}[1]{\\hspace{-0.75mm}_{_{#1}}}\n"); bw.write("\\newcommand{\\supsa}[1]{\\hspace{-1.75mm}^{^{#1}} }\n"); bw.write("\\newcommand{\\supsb}[1]{\\hspace{-0.80mm}^{^{#1}} }\n"); bw.write("\\newcommand{\\sups}[1]{\\hspace{-0.40mm}^{#1}}\n"); bw.write("\\pagestyle{empty}\n"); bw.write("\\begin{document}\n"); bw.close(); } catch(Exception e){ return false; } return true; } /** * Shows the current derivation using YaP or xdvi. */ public boolean show(String fileName) { String viewerName = null; try { runCommand("latex " + fileName + ".tex"); //Process p = java.lang.Runtime.getRuntime().exec("latex " + fileName + ".tex"); if (System.getProperty("os.name").toUpperCase().startsWith("WINDOWS")) viewerName = "yap"; else viewerName = "xdvi"; System.out.println("Close " + viewerName + " to continue ..."); runCommand(viewerName + " " + fileName); // The process will wait indefinitely unless we close each of the related streams:/ //p.getInputStream().close(); //p.getOutputStream().close(); //p.getErrorStream().close(); //p.waitFor(); //p = null; //p = java.lang.Runtime.getRuntime().exec(viewerName + " " + fileName); //p.getInputStream().close(); //p.getOutputStream().close(); //p.getErrorStream().close(); //System.out.println("Close " + viewerName + " to continue ..."); //p.waitFor(); } catch(Exception e) { System.out.println("Error invoking latex/" + viewerName + " : " + e.toString()); return false; } return true; } class myFilter implements FileFilter { String baseFileName=null; public myFilter(String s) { baseFileName = s.toUpperCase(); } public boolean accept(File f) { System.out.println("checking: " + f.getName()); if(f.getName().toUpperCase().startsWith(baseFileName)) return true; else return false; } } public class myFileNameFilter implements FilenameFilter { public String fn=null; public myFileNameFilter(String s) { fn=s; } public boolean accept(File dir, String name) { return name.startsWith(fn); } } public boolean cleanFiles(String fileName) { try { File dir = new File(System.getProperty("user.dir")); myFileNameFilter filter = new myFileNameFilter( fileName) ; File[] allFiles = dir.listFiles(filter); for(int i=0;i signList = null; java.io.BufferedWriter bw = null; try { int i=0, numDerivs=0; TeXSign texSign = null; bw = new java.io.BufferedWriter(new FileWriter( fileName,true) ); signList = sortList( processSign(results,0, 0 ) ); numDerivs = results.getWords().size(); Tokenizer tokenizer = Grammar.theGrammar.lexicon.tokenizer; bw.write("\\deriv{" + Integer.toString(numDerivs) + "}{\n"); for (i=0; i < results.getWords().size(); i++) { if (i != 0) bw.write(" & "); String orth = tokenizer.getOrthography((Word)results.getWords().get(i), false); orth = orth.replaceAll("_", "\\\\_"); orth = orth.replaceAll("%", "\\\\%"); bw.write("\\gf{" + orth + "}"); } bw.write(" \\\\\n\\uline{1}"); for (i=1; i < results.getWords().size(); i++) bw.write(" & \\uline{1}"); bw.write(" \\\\\n"); texSign = (TeXSign)signList.get(0); bw.write("\\cf{"+ texSign.sign.getCategory().toTeX() + "}"); for (i=1; i < numDerivs; i++) { texSign = (TeXSign)signList.get(i); bw.write(" & \\cf{"+ texSign.sign.getCategory().toTeX() + "}"); } bw.write(" \\\\\n"); for (i=numDerivs; i < signList.size(); i++) { String ruleStr=null; texSign = (TeXSign)signList.get(i); ruleStr = ruleToTeX(texSign.sign.getDerivationHistory().getRule().name(), texSign.identation, texSign.sign.getWords().size() ); bw.write(ruleStr); for (int j=0; j < texSign.identation; j++) 
bw.write("&"); bw.write(" \\mc{" + texSign.sign.getWords().size() + "}{\\cf{"+ texSign.sign.getCategory().toTeX() +"}} \\\\\n"); } // Originally 1in, but that's too much when displayed onscreen bw.write("}\n\n\\vspace{5mm}\n\n"); bw.close(); } catch(Exception e) { System.out.println("Error while saving to TeX: " + e.toString()); e.printStackTrace(); return false; } return true; } private List sortList(List signList) { for (int i=0; i < signList.size(); i++) for(int j=i; j < signList.size(); j++) { TeXSign texSign1 = signList.get(i); TeXSign texSign2 = signList.get(j); if(texSign1.height > texSign2.height) { signList.set(i,texSign2); signList.set(j, texSign1); } if(texSign1.height == texSign2.height) if(texSign1.identation > texSign2.identation) { signList.set(i,texSign2); signList.set(j, texSign1); } } return signList; } private class TeXSign { Sign sign = null; int identation = 0; int height = 0; } /** * Calls runCommand/2 assuming that wait=true. * * @param cmd The string containing the command to execute */ public static void runCommand (String cmd) { runCommand(cmd, true); } /** * Run a command with the option of waiting for it to finish. * * @param cmd The string containing the command to execute * @param wait True if the caller should wait for this thread to * finish before continuing, false otherwise. */ public static void runCommand (String cmd, boolean wait) { try { //System.out.println("Running command: "+ cmd); Process proc = Runtime.getRuntime().exec(cmd); // This needs to be done, otherwise some processes fill up // some Java buffer and make it so the spawned process // doesn't complete. BufferedReader br = new BufferedReader(new InputStreamReader(proc.getInputStream())); //String line = null; //while ( (line = br.readLine()) != null) { while ( (br.readLine()) != null) { ; // just eat up the inputstream // Use this if you want to see the output from running // the command. //System.out.println(line); } if (wait) { try { proc.waitFor(); } catch (InterruptedException e) { Thread.currentThread().interrupt(); } } proc.getInputStream().close(); proc.getOutputStream().close(); proc.getErrorStream().close(); } catch (IOException e) { System.out.println("Unable to run command: "+cmd); } } } ================================================ FILE: src/opennlp/ccg/util/XmlScanner.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2006 Michael White (The Ohio State University) // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccg.util; //JAXP packages import javax.xml.parsers.*; import org.xml.sax.*; import org.xml.sax.helpers.*; // jdom import org.jdom.*; import java.io.*; import java.net.*; import java.util.*; /** * Quick-and-dirty class for using JDOM elements in parsing XML * without building a document for the whole XML file. * The parse method parses an XML file with a SAX * parser, constructing JDOM elements for root and the top-level elements, * without attaching the top-level elements to the root. * Along the way, the handleRoot and handleElement * methods are invoked, to handle these elements incrementally. * To use the class, just implement handleElement, and optionally * implement handleRoot, and call parse on the * input XML via its URL. Note that with Java's incremental garbage * collection, an XmlScanner should be reasonably efficient, but not * as efficient as a pure SAX parser (which however requires considerably * more work to implement). At present, the parser only handles elements * and attributes without namespaces; all attributes with namespaces, text nodes, * comments, etc. are ignored. * * @author Michael White * @version $Revision: 1.3 $, $Date: 2009/12/21 03:27:18 $ */ public abstract class XmlScanner extends DefaultHandler { /** * Method for handling the root element, sans children. * The default method does nothing. */ public void handleRoot(Element e) {} /** Method for handling top-level elements. */ public abstract void handleElement(Element e); /** * Method for parsing an XML document, handling the childless root element * and the top-level elements along the way. */ public void parse(URL url) throws IOException { try { // Create a JAXP SAXParserFactory and configure it SAXParserFactory spf = SAXParserFactory.newInstance(); // Create a JAXP SAXParser SAXParser saxParser = spf.newSAXParser(); // Get the encapsulated SAX XMLReader XMLReader xmlReader = saxParser.getXMLReader(); // Set the ContentHandler of the XMLReader xmlReader.setContentHandler(this); // Tell the XMLReader to parse the XML document xmlReader.parse(url.toString()); } catch (ParserConfigurationException exc) { throw (IOException) new IOException().initCause(exc); } catch (SAXException exc) { throw (IOException) new IOException().initCause(exc); } } // flag for whether the root element has been seen yet private boolean seenRoot = false; // the element that is currently being processed private Element current = null; // // ContentHandler methods (just elements) // /** * For the root, a childless element is created and handled, via handleRoot; * for all other elements, a new current element is created and added as a child of the * current element, if any. */ public void startElement(String uri, String localName, String qname, Attributes attributes) throws SAXException { if (!seenRoot) { seenRoot = true; Element root = createElement(uri, localName, qname, attributes); handleRoot(root); return; } Element parent = current; current = createElement(uri, localName, qname, attributes); if (parent != null) parent.addContent(current); } /** * Constructs and returns a new element from the given info. * This implementation ignores the uri and localName, * and filters out any attributes whose qname contains a colon. 
*/ protected Element createElement(String uri, String localName, String qname, Attributes attributes) { Element retval = new Element(qname); if (attributes != null) { int length = attributes.getLength(); for (int i = 0; i < length; i++) { String attrQName = attributes.getQName(i); if (attrQName.indexOf(':') >= 0) continue; String attrValue = attributes.getValue(i); retval.setAttribute(attrQName, attrValue); } } return retval; } /** * Resets the current element to its parent, after first invoking * handleElement on the element if it's a top-level one. */ public void endElement(String uri, String localName, String qname) throws SAXException { if (current == null) return; // for root Element parent = (Element) current.getParent(); if (parent == null) handleElement(current); current = parent; } /** * Example scanner: prints root, counts top- and second-level elements. */ public static class MyScanner extends XmlScanner { int count = 0; int second = 0; public void handleRoot(Element e) { System.out.println("root name: " + e.getName()); System.out.print("root attributes: "); @SuppressWarnings("unchecked") List attrs = (List) e.getAttributes(); for (Attribute attr : attrs) { System.out.print(attr.getName() + "=" + attr.getValue() + " "); } System.out.println(); } public void handleElement(Element e) { count++; second += e.getContentSize(); } } /** * The main method shows an example of using a scanner, by * invoking an instance of MyScanner on the file * whose name is given by the first arg. */ public static void main(String[] args) throws IOException { String filename = args[0]; MyScanner myScanner = new MyScanner(); myScanner.parse(new File(filename).toURI().toURL()); System.out.println("top-level elements: " + myScanner.count); System.out.println("second-level elements: " + myScanner.second); } } ================================================ FILE: src/opennlp/ccgbank/CCGBankConvert.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// /* * $Id: CCGBankConvert.java,v 1.8 2011/11/10 22:18:42 mwhite14850 Exp $ */ package opennlp.ccgbank; import java.io.BufferedReader; import java.io.File; import java.io.FileReader; import java.io.IOException; import java.io.Reader; import java.util.ArrayList; import java.util.List; import java.util.StringTokenizer; import javax.xml.transform.Source; import javax.xml.transform.sax.SAXSource; import opennlp.ccgbank.convert.InfoHelper; import opennlp.ccgbank.convert.XSLTTrueCaser; import opennlp.ccgbank.convert.MorphLookup; import opennlp.ccgbank.parse.CCGbankDerivation; import opennlp.ccgbank.parse.SimpleNode; import org.apache.tools.ant.BuildException; import org.apache.tools.ant.DefaultLogger; import org.apache.tools.ant.Project; import org.apache.tools.ant.ProjectHelper; import org.jdom.Document; import org.jdom.Element; import org.jdom.transform.JDOMSource; import org.xml.sax.InputSource; /** * Converts the CCGBank to a modified version for grammar extraction. *
<p>
    * Within this task, a series of FileLists is specified. These * files are the lists of xsltProcessors that should be used to transform the * CCGBank. These xsltProcessors are processed in the order they occur in the * FileList specified within this task. * @author Scott Martin * @author Rajakrishnan Rajkumar * @version $Revision: 1.8 $ * @see CCGBankExtract */ public class CCGBankConvert extends CCGBankTask { /** Flag for whether to keep case-marking preps in PP categories; defaults to false. */ boolean keepPPHeads = false; TreeWalker treeWalker = new TreeWalker(); CCGbankDerivation deriv = null; File auxFileDirectory, bbnAuxDirectory, wordsFile, stemsFile, currentDirectory = null; /* (non-Javadoc) * @see opennlp.ccgbank.CCGBankTask#start() */ @Override protected void start() throws BuildException { InfoHelper.init(auxFileDirectory, bbnAuxDirectory); String trueCaseListPath=auxFileDirectory.getAbsolutePath()+"/"+"truecase-list.gz"; XSLTTrueCaser.init(trueCaseListPath); try { MorphLookup.init(wordsFile, stemsFile); } catch(IOException io) { throw new BuildException("problem loading words or stems", io, getLocation()); } xsltProcessor = useXMLFilter ? new XMLFilterProcessor(this, this) : new TemplatesProcessor(this); // "prime" parser // TODO fix this hack!! try { File tmp = File.createTempFile(getClass().getName(), "prime"); tmp.deleteOnExit(); deriv = new CCGbankDerivation(new FileReader(tmp)); } catch(IOException e) { throw new BuildException("Problem priming parser: " + e.getMessage(), e, getLocation()); } } /** Read aux files for the next WSJ section **/ @Override protected void nextDirectory(File section) throws BuildException { currentDirectory = section; // only create if a numbered directory File d = new File(target, currentDirectory.getName()); if(!d.exists() && !d.mkdirs()) { throw new BuildException("unable to create directory " + d); } //Read in aux files try { InfoHelper.readBBNAuxfiles(section.getName()); InfoHelper.readQuoteAuxfiles(section.getName()); InfoHelper.readPTBAuxfiles(section.getName()); InfoHelper.readTreeAuxfiles(section.getName()); } catch(NumberFormatException nfe) { // not a numbered PTB directory } } @Override protected InputSource nextFile(File file) throws BuildException { try { Reader reader = new BufferedReader(new FileReader(file)); if(deriv == null) { deriv = new CCGbankDerivation(reader); } else { CCGbankDerivation.ReInit(reader); } SimpleNode root = CCGbankDerivation.start(); Element result = new Element("Derivation"); String fileName = file.getName(); int start = fileName.contains(File.separator) ? fileName.lastIndexOf(File.separatorChar) : 0; StringBuilder sb = new StringBuilder( fileName.substring(start, fileName.lastIndexOf('.'))); sb.append(".xml"); File targetDir = new File(target, currentDirectory.getName()); File targetFile = new File(targetDir, sb.toString()); xsltProcessor.resetSerializer(); xsltProcessor.setTarget(targetFile); Document doc = new Document(treeWalker.eval(root, result)); // TODO attempt to get error reporting for file / line !! 
Source s = new JDOMSource(doc); s.setSystemId(file.toURI().toString()); return SAXSource.sourceToInputSource(s); } catch(Exception e) { throw new BuildException(e, getLocation()); } } /** @param keepPPHeads the keepPPHeads value to set */ public void setKeepPPHeads(boolean keepPPHeads) { this.keepPPHeads = keepPPHeads; } /** * @param stemsFile the stemsFile to set */ public void setStemsFile(File stemsFile) { this.stemsFile = stemsFile; } /** * @param wordsFile the wordsFile to set */ public void setWordsFile(File wordsFile) { this.wordsFile = wordsFile; } /** * @param auxFileDirectory the auxFileDirectory to set */ public void setAuxFileDirectory(File auxFileDirectory) { this.auxFileDirectory = auxFileDirectory; } /** * @param bbnAuxDirectory the bbnAuxDirectory to set */ public void setBbnAuxDirectory(File bbnAuxDirectory) { this.bbnAuxDirectory = bbnAuxDirectory; } public static void main(String[] args) { File baseDir = new File(System.getProperty("user.dir")); File buildFile = new File(baseDir, "build.xml"); Project project = new Project(); project.init(); project.setBaseDir(baseDir); ProjectHelper helper = ProjectHelper.getProjectHelper(); project.setProjectReference(helper); helper.parse(project, buildFile); DefaultLogger logger = new DefaultLogger(); logger.setErrorPrintStream(System.err); logger.setOutputPrintStream(System.out); project.addBuildListener(logger); project.executeTarget("convert-base"); } class TreeWalker { // General purpose datastructure to store ccgbank indices of categories. // Refreshed after the lifespan of a node is over. public List idList = new ArrayList(); // flag for whether under a leaf node; // used to control whether to add fs id's private boolean underLeaf = false; public Element eval(SimpleNode node, Element root) throws Exception { // No:of children of any given node int numC = node.jjtGetNumChildren(); // Loop & flag variables int i = 0; SimpleNode child; // Processing the child nodes of the current node. for (i = 0; i < numC; i++) { child = (SimpleNode) node.jjtGetChild(i); // Cat spec without co-indexation info in the leafnodes if (child.type.equals("Redundant")) { if (node.type.equals("Leafnode")) { node.catRedundant = child.print(); continue; } // Processes treenode categories if (node.type.equals("Treenode")) child.type = "complexcat"; } // The header node is accessed and the CCGbankId is passed on to the // treenode root of the sentence which is processed next if (child.type.equals("Header")) { i++; String temp1 = child.getHeader(); int spacePos = temp1.indexOf(' '); if (spacePos > 0) temp1 = temp1.substring(0, spacePos); child = (SimpleNode) node.jjtGetChild(i); child.setHeader(temp1); // System.out.println(temp1); } // Xml element which is going to be generated. Element leaf = new Element(child.type); if (child.type.equals("complexcat") || child.type.equals("Treenode") || child.type.equals("Leafnode")) { // Atomic categories are represented in the javacc tree as // catSpec-aotmcat. So for such cases the catSpec child is // skipped and the next child is accessed. if (child.jjtGetNumChildren() == 1 && child.type.equals("complexcat")) { child = (SimpleNode) child.jjtGetChild(0); // The element which is to be added to the xml // representation leaf = new Element("atomcat"); // Extracting the content of the node and storing it. node.cat = child.print(); } else { // A complexcat element is created. leaf = ccinserter(child, leaf); // Extracting the content of the node and storing it. 
if (root.getName().equals("Leafnode")) { node.cat = child.print(); } if (root.getName().equals("Treenode") && leaf.getName().equals("complexcat")) { // Leafnode and treenode cat spec elements created node.cat = child.print(); } // Recursive processing of the children of the current node leaf = eval(child, leaf); // Sending Leaf,Tree nodes for to a function which inserts // the family (ie normalized cat spec) of its contents. if (!child.type.equals("complexcat")) leaf = catInserter(child, leaf); // Adding the current element to its parent in the xml tree. root.addContent(leaf); continue; } } // Slash elements added to the tree if (child.cat.equals("/") || child.cat.equals("\\")) { leaf = opinserter(child); root.addContent(leaf); continue; } // Atomcat elements added to the tree leaf = atomcatinserter(child); root.addContent(leaf); // if(!child.type.matches("\\p{Punct}")) } // The final result of the above operations returned. return root; } public Element ccinserter(SimpleNode node, Element leaf) { // This function produces complexcat/treenode/leafnode elements. // mww: the name of this function is not very helpful // The node can be of any of the above types. String name; name = node.type; // Set treebankId,parseNo at root of the sent String h = node.getHeader(); if (h != null) leaf.setAttribute("Header", h); // Treenode info ie head,daughter represented if (name.equals("Treenode")) { leaf.setAttribute("head", node.head); leaf.setAttribute("dtr", node.dtr); idList.clear(); underLeaf = false; } // Leafnode info represented if (name.equals("Leafnode")) { leaf.setAttribute("lexeme", node.lex); // nb: may be truecased later leaf.setAttribute("lexeme0", node.lex); leaf.setAttribute("pos", node.pos); idList.clear(); underLeaf = true; } // add propbank info here if (node.nodeRoles != null) { String roles = ""; for (SimpleNode.LexSenseRole lexSenseRole : node.nodeRoles) { if (lexSenseRole.role.equals("rel")) { leaf.setAttribute("rel", lexSenseRole.lex + "." + lexSenseRole.sense); } else { String role = adjustRole(lexSenseRole.role); roles += lexSenseRole.lex + "." + lexSenseRole.sense + ":" + role + " "; } } if (roles.length() > 0) leaf.setAttribute("roles", roles.trim()); } if (node.argRoles != null) { String args = ""; for (String role : node.argRoles) { role = adjustRole(role); args += role + " "; } leaf.setAttribute("argRoles", args.trim()); } // done return leaf; } public Element atomcatinserter(SimpleNode node) throws Exception { // Predicate for atomcat creation. // Flag signifies whether the elem is a single atomcat. // Relevant as if the present cat is an atomcat LF variable can be set // in the syntax here itself. StringTokenizer lex; Element atomcat = new Element("atomcat"); Element fs = new Element("fs"); Element feat = new Element("feat"); String id = "NotGiven"; String form; // Current element info extracted from the node String elem = node.print(); // Index extracted by sensing undescore delimiter if (elem.contains("_")) { // elem=elem.replaceAll(":[A-Z]",""); lex = new StringTokenizer(elem, "_"); elem = lex.nextToken(); id = lex.nextToken(); String x[] = id.split(":"); // System.out.println(id); if (x.length == 2) { // mww: moved this to atomcat //feat.setAttribute("attr", "dep"); //feat.setAttribute("val", x[1]); //fs.addContent(feat); atomcat.setAttribute("dep", x[1]); } id = id.replaceAll(":[A-Z]", ""); } else { // Default id 1 is alloted otherwise id = Integer.toString(idList.size() + 1); idList.add(id); } // Normalizing the id by comparing with previous indices. 
if (!idList.contains(id)) idList.add(id); id = Integer.toString(idList.indexOf(id) + 1); // Normalized index is set (leaves only) if (underLeaf) fs.setAttribute("id", id); // make lowercase elem = elem.toLowerCase(); // remove superfluous [nb] in np[nb] elem = elem.replaceAll("np\\[nb\\]", "np"); // also strip PP heads if apropos elem = stripPPHeads(elem); // Form attrtibute detected and set. if (elem.contains("[")) { lex = new StringTokenizer(elem, "[,]"); elem = lex.nextToken(); form = lex.nextToken(); feat = new Element("feat"); feat.setAttribute("attr", "form"); feat.setAttribute("val", form); fs.addContent(feat); } // add fs if non-empty if (underLeaf || fs.getContentSize() > 0) atomcat.addContent(fs); atomcat.setAttribute("type", elem); return atomcat; } public Element opinserter(SimpleNode node) { Element slash = new Element("slash"); String dir; String op = node.cat; // Slash direction sensed and set. if (op.equals("\\")) dir = "<"; else dir = ">"; slash.setAttribute("dir", op); slash.setAttribute("mode", dir); return slash; } public Element catInserter(SimpleNode node, Element leaf) { int i; // The normalization process. Relevant indices replaced by 1,2,3..n if (idList.size() > 0) { for (i = 0; i < idList.size(); i++) node.cat = node.cat.replaceAll(idList.get(i), Integer.toString(i + 1)); } String l = node.getLeftover(); if (l != null) node.cat = node.cat + l; // Purging the cat spec of indices outside brackets & colons ie )_2 ,:B int ind = node.cat.indexOf(")_"); while (ind != -1) { String str1 = node.cat.substring(0, ind + 1); String str2 = node.cat.substring(ind + 1, node.cat.length()); str2 = str2.replaceFirst("_(\\p{Digit})++", ""); // System.out.println(str1); // System.out.println(str2); node.cat = str1 + str2; ind = node.cat.indexOf(")_"); } node.cat = node.cat.replaceAll(":[A-Z]", ""); // Add categories with normalized indices, lowercased String cat = node.cat.toLowerCase(); cat = cat.replaceAll("np\\[nb\\]", "np"); // also strip PP heads if apropos cat = stripPPHeads(cat); leaf.setAttribute("cat", cat); String cat0 = ""; // Add the same category to the treenodes if (node.type.equals("Treenode")) cat0 = node.cat; else cat0 = node.catRedundant; // Add the bare category to the leafnodes leaf.setAttribute("cat0", cat0); // Refresh index list. idList.clear(); return leaf; } } // strips PP heads if apropos private String stripPPHeads(String cat) { if (keepPPHeads) return cat; return cat.replaceAll("pp\\[[a-z]+\\]", "pp"); } // adjusts role, stripping PP head if apropos private String adjustRole(String role) { role = role.replaceFirst("ARG", "Arg"); if (!keepPPHeads) { int hyph = role.indexOf('-'); if (hyph > 0) role = role.substring(0, hyph); } return role; } } ================================================ FILE: src/opennlp/ccgbank/CCGBankExtract.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. 
// // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// /* * $Id: CCGBankExtract.java,v 1.5 2011/11/04 01:49:57 raja-asoka Exp $ */ package opennlp.ccgbank; import java.io.BufferedInputStream; import java.io.File; import java.io.FileInputStream; import java.io.FileNotFoundException; import java.io.FileWriter; import java.io.IOException; import java.io.InputStream; import java.io.PrintWriter; import java.io.Writer; import java.util.EnumMap; import java.util.Map; import javax.xml.transform.Source; import javax.xml.transform.Templates; import javax.xml.transform.TransformerConfigurationException; import javax.xml.transform.TransformerException; import javax.xml.transform.TransformerFactory; import javax.xml.transform.URIResolver; import javax.xml.transform.sax.SAXTransformerFactory; import javax.xml.transform.stream.StreamSource; import opennlp.ccgbank.CCGBankTaskTemplates.Type; import opennlp.ccgbank.extract.FreqTally; import opennlp.ccgbank.extract.RulesTally; import opennlp.ccgbank.extract.Testbed; import org.apache.tools.ant.BuildException; import org.xml.sax.InputSource; import org.xml.sax.SAXException; /** * Extracts a grammar from a converted version of the CCGBank. * @author Scott Martin * @version $Revision: 1.5 $ * @see CCGBankConvert */ public class CCGBankExtract extends CCGBankTask implements URIResolver { static String pkgPath = null; static final String LEXICON_TEMPLATE = "lexicon-base.xsl", RULES_TEMPLATE = "rules-base.xsl"; String grammarName = "ccgbankextract"; boolean pPheads = true, skipUnmatched = false; int catFreqCutoff = 1, lexFreqCutoff = 1, openFreqCutoff = 100, ruleFreqCutoff = 1; CCGBankTaskTestbed testbed = null; File lexiconTempFile, rulesTempFile; TemplatesProcessor ruleProcessor; Map xsltProcessors = new EnumMap(Type.class); public CCGBankExtract() { super(); if(pkgPath == null) { pkgPath = getClass().getPackage().getName().replace('.', '/'); } } /** * Sets the name of the generated grammar. * @param grammarName The name of the generated grammar. This is the string * that will appear in the "name" attribute of the root element of the * generated grammar's grammar.xml file. 
*/ public void setGrammarName(String grammarName) { this.grammarName = grammarName; } /** * @param tb the testbed to set */ public void addConfiguredTestbed(CCGBankTaskTestbed tb) { this.testbed = tb; } /** * @param catFreqCutoff the catFreqCutoff to set */ public void setCatFreqCutoff(int catFreqCutoff) { this.catFreqCutoff = catFreqCutoff; } /** * @param lexFreqCutoff the lexFreqCutoff to set */ public void setLexFreqCutoff(int lexFreqCutoff) { this.lexFreqCutoff = lexFreqCutoff; } /** * @param openFreqCutoff the openFreqCutoff to set */ public void setOpenFreqCutoff(int openFreqCutoff) { this.openFreqCutoff = openFreqCutoff; } /** * @param pPheads the ppheads to set */ public void setPPheads(boolean pPheads) { this.pPheads = pPheads; } /** * @param ruleFreqCutoff the ruleFreqCutoff to set */ public void setRuleFreqCutoff(int ruleFreqCutoff) { this.ruleFreqCutoff = ruleFreqCutoff; } /** * @param skipUnmatched the skipUnmatched to set */ public void setSkipUnmatched(boolean skipUnmatched) { this.skipUnmatched = skipUnmatched; } /* (non-Javadoc) * @see javax.xml.transform.URIResolver#resolve(java.lang.String, java.lang.String) */ public Source resolve(String href, String base) { if(href != null && href.length() > 0 && href.startsWith(pkgPath)) { String lastChunk = (href.contains("/") && !href.endsWith("/")) ? href.substring(href.lastIndexOf('/') + 1) : href; if(lastChunk.endsWith(CCGBankExtract.LEXICON_TEMPLATE) || lastChunk.endsWith(CCGBankExtract.RULES_TEMPLATE)) { return new StreamSource(getResource(href)); } } return new StreamSource(new File(href)); } /* (non-Javadoc) * @see opennlp.ccgbank.CCGBankTask#addConfiguredCCGBankTaskTemplates(opennlp.ccgbank.CCGBankTaskTemplates) */ @Override public void addConfiguredTemplates(CCGBankTaskTemplates taskTemplates) { if(xsltProcessors.containsKey(taskTemplates.type)) { throw new BuildException(taskTemplates.type + " extraction type is multiply defined"); } XSLTProcessor xp = useXMLFilter ? 
new XMLFilterProcessor(this, this) : new TemplatesProcessor(this); xp.addTemplates(taskTemplates); xp.transformerFactory.setURIResolver(this); xsltProcessors.put(taskTemplates.type, xp); } /* (non-Javadoc) * @see opennlp.ccgbank.CCGBankTask#start() */ @Override protected void start() throws BuildException { xsltProcessor = new TemplatesProcessor(this); ((TemplatesProcessor)xsltProcessor).addTemplates( loadTemplates(pkgPath + "/" + CCGBankExtract.LEXICON_TEMPLATE)); ruleProcessor = new TemplatesProcessor(this); ruleProcessor.addTemplates(loadTemplates(pkgPath + "/" + CCGBankExtract.RULES_TEMPLATE)); FreqTally.reset(); FreqTally.CAT_FREQ_CUTOFF = catFreqCutoff; FreqTally.LEX_FREQ_CUTOFF = lexFreqCutoff; FreqTally.OPEN_FREQ_CUTOFF = openFreqCutoff; RulesTally.reset(); RulesTally.RULE_FREQ_CUTOFF = ruleFreqCutoff; RulesTally.KEEP_UNMATCHED = !skipUnmatched; try { lexiconTempFile = File.createTempFile(grammarName, ".xml"); lexiconTempFile.deleteOnExit(); xsltProcessor.setTarget(lexiconTempFile); rulesTempFile = File.createTempFile(grammarName + "-rules", ".xml"); rulesTempFile.deleteOnExit(); ruleProcessor.setTarget(rulesTempFile); Writer w = xsltProcessor.serializer.getWriter(); w.write(""); w.flush(); Writer rw = ruleProcessor.serializer.getWriter(); rw.write(""); rw.flush(); } catch(IOException io) { throw new BuildException(io, getLocation()); } } /* (non-Javadoc) * @see opennlp.ccgbank.CCGBankTask#nextFile(java.io.File) */ @Override protected InputSource nextFile(File file) throws BuildException { try { ruleProcessor.process(super.nextFile(file)); } catch(IOException io) { throw new BuildException("I/O problem processing " + file + ": " + io.getMessage(), io, getLocation()); } catch(SAXException se) { throw new BuildException("Problem processing " + file + ": " + se.getMessage(), se, getLocation()); } catch(TransformerException te) { throw new BuildException("Problem processing " + file + ": " + te.getMessageAndLocation(), te, getLocation()); } return super.nextFile(file); // TODO is this right? } /* (non-Javadoc) * @see opennlp.ccgbank.CCGBankTask#finish() */ @Override protected void finish() throws BuildException { try { Writer w = xsltProcessor.serializer.getWriter(); w.write(""); w.close(); Writer rw = ruleProcessor.serializer.getWriter(); rw.write(""); rw.close(); } catch(IOException io) { throw new BuildException(io, getLocation()); } // generate lexicon, morph, rules for(Type t : xsltProcessors.keySet()) { if(t == Type.LEXICON) { try { FreqTally.printTally(target); } catch(FileNotFoundException fnfe) { throw new BuildException("problem generating frequencies", fnfe, getLocation()); } } else if(t == Type.RULES) { try { RulesTally.printTally(target); } catch(FileNotFoundException fnfe) { throw new BuildException( "problem generating rule frequencies", fnfe, getLocation()); } } String fileName = t.fileName(); log("Generating " + fileName); try { XSLTProcessor xp = xsltProcessors.get(t); xp.setTarget(new File(target, fileName)); xp.process(new InputSource( new BufferedInputStream(new FileInputStream( (t == Type.RULES) ? 
rulesTempFile : lexiconTempFile)))); } catch(IOException io) { throw new BuildException("I/O problem writing " + fileName, io, getLocation()); } catch(TransformerException te) { throw new BuildException("Problem transforming " + fileName + ": " + te.getMessageAndLocation(), te, getLocation()); } catch(SAXException se) { throw new BuildException("Problem transforming " + fileName + ": " + se.getMessage(), se, getLocation()); } } // generate grammar.xml, if it doesn't already exist // nb: should eventually make schema refs relative to OPENCCG_HOME try { File gramFile = new File(target, "grammar.xml"); if (!gramFile.exists()) { log("Generating grammar.xml"); PrintWriter gramOut = new PrintWriter(new FileWriter(gramFile)); gramOut.println(""); gramOut.println(""); gramOut.println(" "); gramOut.println(" "); gramOut.println(" "); gramOut.println(""); gramOut.println(""); gramOut.println(""); gramOut.println(""); gramOut.println(""); gramOut.println(""); gramOut.println(""); gramOut.println(""); gramOut.println(""); gramOut.println(""); gramOut.close(); } } catch(IOException io) { throw new BuildException("problem generating grammar.xml", io, getLocation()); } if(testbed != null) { log("Creating testbed ..."); try { Testbed ct = new Testbed(ccgBankTaskSources, target, testbed); ct.createTestFiles(); } catch(Exception e) {e.printStackTrace(); throw new BuildException("problem generating testbed: " + e.getMessage(), e, getLocation()); } } } Templates loadTemplates(String resourceName) throws BuildException { try { // XXX nb: no xsltc option this way //TransformerFactory tf = XSLTProcessor.newTransformerFactory(); SAXTransformerFactory tf = (SAXTransformerFactory)TransformerFactory.newInstance(); return tf.newTemplates(new StreamSource(new BufferedInputStream( getResource(resourceName)))); } catch(TransformerConfigurationException e) { throw new BuildException("Problem loading template " + resourceName + ": " + e.getMessage(), e, getLocation()); } } /** * Loads a resource using the fully qualified name with the current * class loader */ InputStream getResource(String resourceName) { return getClass().getClassLoader().getResourceAsStream(resourceName); } } ================================================ FILE: src/opennlp/ccgbank/CCGBankTask.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
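// CCGBankExtract is an Ant task (via CCGBankTask, defined next), so it is normally
// configured from a build file; reading its setters and addConfigured* methods, a
// programmatic invocation would look roughly like the sketch below. The directory
// names, the grammar name, and the omission of the <templates> filelists are
// illustrative assumptions, not the project's actual build configuration.
package opennlp.ccgbank;

import java.io.File;
import org.apache.tools.ant.Project;
import org.apache.tools.ant.types.FileSet;

public class ExtractDriver {
    public static void main(String[] args) {
        Project proj = new Project();
        proj.init();

        CCGBankExtract extract = new CCGBankExtract();
        extract.setProject(proj);
        extract.setTarget(new File("extract/grammar"));  // output directory for lexicon.xml etc.
        extract.setGrammarName("ccgbank");               // name attribute written into grammar.xml
        extract.setCatFreqCutoff(1);
        extract.setRuleFreqCutoff(1);

        // the converted corpus files to process
        CCGBankTaskSources sources = new CCGBankTaskSources();
        FileSet corpus = new FileSet();
        corpus.setProject(proj);
        corpus.setDir(new File("converted"));
        corpus.setIncludes("**/*.xml");
        sources.addConfiguredFileSet(corpus);
        extract.addConfiguredSources(sources);

        // in a real build, LEXICON/MORPH/RULES <templates> filelists would also be
        // added via addConfiguredTemplates before running the task
        extract.execute();
    }
}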
////////////////////////////////////////////////////////////////////////////// /* * $Id: CCGBankTask.java,v 1.5 2010/11/30 18:44:32 mwhite14850 Exp $ */ package opennlp.ccgbank; import java.io.BufferedInputStream; import java.io.File; import java.io.FileInputStream; import java.io.FileNotFoundException; import java.io.IOException; import java.util.ArrayList; import java.util.HashSet; import java.util.List; import java.util.Set; import javax.xml.transform.ErrorListener; import javax.xml.transform.TransformerException; import opennlp.ccgbank.parse.TokenMgrError; import org.apache.tools.ant.BuildException; import org.apache.tools.ant.Task; import org.apache.tools.ant.TaskContainer; import org.xml.sax.ErrorHandler; import org.xml.sax.InputSource; import org.xml.sax.SAXException; import org.xml.sax.SAXParseException; /** * Abstract class to provide functionality for applying XSLT to an XML stream. *

    * This class is designed to be run as a task from within an Ant build file. * There is one concrete implementer for each of the separate tasks of * converting the CCGBank and extracting a grammar for the converted corpus. * @author Scott Martin * @version $Revision: 1.5 $ * @see CCGBankConvert * @see CCGBankExtract * @see Ant home page */ public abstract class CCGBankTask extends Task implements TaskContainer,ErrorHandler,ErrorListener { File target; Set ccgBankTaskSources = new HashSet(); List ccgBankTaskTemplates = new ArrayList(); XSLTProcessor xsltProcessor = null; boolean useXMLFilter = true; boolean terminateOnError = true, terminateOnWarning = false; /** * Counters */ int directoriesProcessed, filesProcessed, warnings, errors; /** * Adds a sub-task, but included here only for binary compatibility. * @throws BuildException Always throws an exception, only * sourcesSet or xsltProcessors can be added to this task. */ public void addTask(Task task) { throw new BuildException("nested task \"" + task.getTaskName() + "\" not supported, only sourcesSet or xsltProcessors"); } /** * Sets the target directory. * @param target The location of the result of the XSLT conversion (the * converted corpus, extracted grammar, etc.). * @throws BuildException If the target is null * or not a directory. */ public void setTarget(File target) { this.target = target; if(target == null) { throw new BuildException("no target specified"); } if(!target.exists()) { target.mkdirs(); } else if(!target.isDirectory()) { throw new BuildException("specified target is not a directory"); } } /** * @param terminateOnError the terminateOnError to set */ public void setTerminateOnError(boolean terminateOnError) { this.terminateOnError = terminateOnError; } /** * @param terminateOnWarning the terminateOnWarning to set */ public void setTerminateOnWarning(boolean terminateOnWarning) { this.terminateOnWarning = terminateOnWarning; } /** * @param useXMLFilter the useXMLFilter to set */ public void setUseXMLFilter(boolean useXMLFilter) { this.useXMLFilter = useXMLFilter; } /** * Adds a file set of source files. */ public void addConfiguredSources(CCGBankTaskSources sources) { ccgBankTaskSources.add(sources); } /** * Adds a series of xsltProcessors for XSLT transformation. */ public void addConfiguredTemplates(CCGBankTaskTemplates templates) { ccgBankTaskTemplates.add(templates); } /** * Hook to be overridden by subclasses that want notification of the start * of the transformation process. */ protected void start() throws BuildException { // to be overridden } /** * Hook to be overridden by subclasses that want notification of the end * of the transformation process. */ protected void finish() throws BuildException { // to be overridden } /** * Hook that lets subclasses be notified when processing starts on a new * directory. * @param section The file (directory) on which processing is starting. */ protected void nextDirectory(File section) throws BuildException { // to be overridden } /** * Hook that lets implementing subclasses know when processing starts on * a new file. * @param file The file on which processing is about to start. * @return The input source to process. */ protected InputSource nextFile(File file) throws BuildException { try { return new InputSource( new BufferedInputStream(new FileInputStream(file))); } catch(FileNotFoundException fnfe) { throw new BuildException("Unable to find file " + file, fnfe, getLocation()); } } /** * Required by {@link ErrorHandler}. 
Reports the specified error using the * Ant task {@link Task#log(String)} method. */ public void error(SAXParseException exception) { errors++; handleError("Error", exception, terminateOnError); } /** * Required by {@link ErrorHandler}. Reports the specified error using the * Ant task {@link Task#log(String)} method. */ public void fatalError(SAXParseException exception) { errors++; handleError("Fatal error", exception, terminateOnError); } /** * Required by {@link ErrorHandler}. Reports the specified error using the * Ant task {@link Task#log(String)} method. */ public void warning(SAXParseException exception) { warnings++; handleError("Warning", exception, terminateOnWarning); } /** * Required by {@link ErrorListener}. Reports the specified error using the * Ant task {@link Task#log(String)} method. */ public void error(TransformerException exception) { errors++; handleError("Error", exception, terminateOnError); } /** * Required by {@link ErrorListener}. Reports the specified error using the * Ant task {@link Task#log(String)} method. */ public void fatalError(TransformerException exception) { errors++; handleError("Fatal error", exception, terminateOnError); } /** * Required by {@link ErrorListener}. Reports the specified error using the * Ant task {@link Task#log(String)} method. */ public void warning(TransformerException exception) { warnings++; handleError("Warning", exception, terminateOnWarning); } /** * Helper method for the methods required by {@link ErrorHandler}. */ void handleError(String prefix, SAXParseException spe, boolean terminate) { StringBuilder sb = new StringBuilder(prefix); sb.append(": problem in parse: "); sb.append(spe.getSystemId()); sb.append(" on line "); sb.append(spe.getLineNumber()); sb.append(", column "); sb.append(spe.getColumnNumber()); sb.append(": "); sb.append(spe.getMessage()); if(!terminate) { log(sb.toString()); } else { throw new BuildException(sb.toString(), spe, getLocation()); } } /** * Helper method for the methods required by {@link ErrorListener}. */ void handleError(String prefix, TransformerException te, boolean terminate) { StringBuilder sb = new StringBuilder(prefix); sb.append(": problem in transform: "); sb.append(te.getMessageAndLocation()); if(!terminate) { log(sb.toString()); } else { throw new BuildException(sb.toString(), te, getLocation()); } } /** * Does the work of transforming the CCGBank and extracting grammars. * @throws BuildException In case no sourcesSet have been specified or an * error occurs during the transformation process. *

    * This method calls {@link #start()}, {@link #finish()}, * {@link #nextDirectory(File)}, and {@link #nextFile(File)} as required. */ @Override public void execute() throws BuildException { if(ccgBankTaskSources.isEmpty()) { throw new BuildException("no sourcesSet specified"); } filesProcessed = directoriesProcessed = warnings = errors = 0; start(); log("Target: " + target); if(xsltProcessor == null) { // should have been configured throw new BuildException("null XSLT processor"); } xsltProcessor.addAllTemplates(ccgBankTaskTemplates); try { for(CCGBankTaskSources sources : ccgBankTaskSources) { File prevDir = null; File currentDir = null; for(File file : sources) { currentDir = file.getParentFile(); if(!currentDir.equals(prevDir)) { log("Processing " + currentDir + " ..."); directoriesProcessed++; nextDirectory(currentDir); } prevDir = currentDir; log("Processing " + file); filesProcessed++; xsltProcessor.process(nextFile(file)); } } } catch(IOException io) { throw new BuildException("I/O problem during processing: " + io.getMessage(), io, getLocation()); } catch(SAXException se) { throw new BuildException("Problem during processing: " + se.getMessage(), se, getLocation()); } catch(TransformerException te) { throw new BuildException("I/O problem during processing: " + te.getMessageAndLocation(), te, getLocation()); } catch (TokenMgrError te) { throw new BuildException("I/O problem during processing: " + te.getMessage(), te, getLocation()); } finally { finish(); StringBuilder sb = new StringBuilder("Processed "); sb.append(filesProcessed); sb.append(" files in "); sb.append(directoriesProcessed); sb.append(" directories with "); sb.append(errors); sb.append(" error"); if(errors != 1) { sb.append('s'); } sb.append(" and "); sb.append(warnings); sb.append(" warning"); if(warnings != 1) { sb.append('s'); } log(sb.toString()); } } } ================================================ FILE: src/opennlp/ccgbank/CCGBankTaskFileGroup.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// /* * $Id: CCGBankTaskFileGroup.java,v 1.1 2009/11/09 19:21:50 mwhite14850 Exp $ */ package opennlp.ccgbank; import java.io.File; import java.util.Collection; import java.util.Iterator; import java.util.NoSuchElementException; import org.apache.tools.ant.BuildException; import org.apache.tools.ant.Task; import org.apache.tools.ant.TaskContainer; import org.apache.tools.ant.types.FileList; import org.apache.tools.ant.types.FileSet; /** * Abstract class providing generalized functionality for file groups used by * {@link CCGBankTask}s. *

    * For convenience, this class implements {@link Iterable} over {@link File}s. * This allows instances to be used in standard iteration constructs while * abstracting away from implementation details such as multiple * {@link FileSet}s or {@link FileList}s. * @author Scott Martin * @version $Revision: 1.1 $ */ public abstract class CCGBankTaskFileGroup extends Task implements TaskContainer,Iterable { protected Collection subGroups; /** * Creates a file group over the specified collection of subgroups. * @param subGroups The collection over which this class is an abstracted * view. */ protected CCGBankTaskFileGroup(Collection subGroups) { this.subGroups = subGroups; } /** * Adds a subgroup to the collection of subgroups this class abstracts over. */ protected void addGroup(G group) { subGroups.add(group); } /** * Gets all the files in a group as an array. To be implemented by extending * classes, as {@link FileSet} and {@link FileList} represent files * differently. * @return The collection of files in group, as an array. */ protected abstract File[] getFiles(G group); /** * Creates an array of files given a directory and an array of file names * (specified relative to that directory). * @param directory The directory that the specified file names are relative * to. * @param fileNames The file names, relative to the specified directory. * @return An array containing all the files as specified relative to the * specified directory. */ protected File[] makeFiles(File directory, String[] fileNames) { File[] files = new File[fileNames.length]; for(int i = 0; i < fileNames.length; i++) { files[i] = new File(directory, fileNames[i]); } return files; } /** * Included for binary compatibility with {@link TaskContainer}. * @throws BuildException Always throws a build exception, as only the * parameterized type of this class's subgroups can be contained by this * task. */ public void addTask(Task task) { throw new BuildException("nested task \"" + task + "\" not supported, only " + subGroups.getClass().getTypeParameters()[0] .getGenericDeclaration()); } /** * Provides an * iterator over all the files in the collection of subgroups contained by * this instance. The iterator returned will iterate through files in all * the subgroups returned in the same order as the order returned by the * subgroups collection. */ public Iterator iterator() { return new AllFileView(); } /** * Implements an iterator over the files contained in the subgroups * collection. This class iterates over all the files contained in the * groups in the subgroups collection, in the order that they * are returned by the subgroups collection. * @author Scott Martin * @version $Revision: 1.1 $ */ class AllFileView implements Iterator { Iterator groupIterator = subGroups.iterator(); Iterator currentIterator; /** * Tests whether there is a next file. * @return true If the current subgroup contains a next file, or if * there is a next subgroup that is non-empty. */ public boolean hasNext() { while((currentIterator == null || !currentIterator.hasNext()) && groupIterator.hasNext()) { currentIterator = new FileArrayIterator( getFiles(groupIterator.next())); } // current may be empty return (currentIterator != null && currentIterator.hasNext()); } /** * Gets the next file in the series, as returned in order by the * subgroups collection. * @throws NoSuchElementException If the collection of subgroups is * exhausted. 
*/ public File next() { if(!hasNext()) { throw new NoSuchElementException("elements exhausted"); } return currentIterator.next(); } /** * Included only for binary compatibility with {@link Iterator}. * @throws UnsupportedOperationException Always, as this operation is * not supported. */ public void remove() { throw new UnsupportedOperationException("removed not supported"); } } /** * Implements an iterator view of an array of {@link File} objects. * @author Scott Martin * @version $Revision: 1.1 $ */ class FileArrayIterator implements Iterator { File[] array; int index = 0; /** * Creates a new iterator view over the specified array of files. * @param array The file array backing this iterator view. */ FileArrayIterator(File[] array) { this.array = array; } /** * Tests whether the array of files is exhausted. * @return true If the current index is less than the array length. */ public boolean hasNext() { return (index < array.length); } /** * Gets the next file in series, as specified by the array backing this * iterator view. * @throws NoSuchElementException If the array of files is exhausted. * @see #hasNext() */ public File next() { if(!hasNext()) { throw new NoSuchElementException("elements exhausted"); } return array[index++]; } /** * Included only for binary compatibility with {@link Iterator}. * @throws UnsupportedOperationException Always, as this operation is * not supported. */ public void remove() { throw new UnsupportedOperationException("remove not supported"); } } } ================================================ FILE: src/opennlp/ccgbank/CCGBankTaskSources.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// /* * $Id: CCGBankTaskSources.java,v 1.1 2009/11/09 19:21:50 mwhite14850 Exp $ */ package opennlp.ccgbank; import java.io.File; import java.util.HashSet; import org.apache.tools.ant.BuildException; import org.apache.tools.ant.DirectoryScanner; import org.apache.tools.ant.Project; import org.apache.tools.ant.types.FileSet; /** * Represents a set of source files. This class encapsulates a set of * {@link FileSet}s. * @author Scott Martin * @version $Revision: 1.1 $ * @see Ant home page * @see FileSet */ public class CCGBankTaskSources extends CCGBankTaskFileGroup { /** * Creates a new sources object (required by Ant). */ public CCGBankTaskSources() { super(new HashSet()); } /** * Adds a file set to this sources object. */ public void addConfiguredFileSet(FileSet fileSet) { addGroup(fileSet); } /** * Gets the files in the specified group as an array of files. 
The files in * the returned array are in the order returned by group's * {@link FileSet#getDirectoryScanner(Project) directory scanner}. */ @Override protected File[] getFiles(FileSet group) { Project proj = getProject(); DirectoryScanner scanner = group.getDirectoryScanner(proj); scanner.scan(); String[] fileNames = scanner.getIncludedFiles(); if(fileNames.length == 0) { throw new BuildException("no source files included"); } return makeFiles(group.getDir(proj), fileNames); } } ================================================ FILE: src/opennlp/ccgbank/CCGBankTaskTemplates.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// /* * $Id: CCGBankTaskTemplates.java,v 1.1 2009/11/09 19:21:50 mwhite14850 Exp $ */ package opennlp.ccgbank; import java.io.File; import java.util.ArrayList; import org.apache.tools.ant.Project; import org.apache.tools.ant.types.FileList; /** * Represents a series of templates. This class encapsulates a list of lists of * {@link FileList}s. * @author Scott Martin * @version $Revision: 1.1 $ * @see Ant home page * @see FileList */ public class CCGBankTaskTemplates extends CCGBankTaskFileGroup { /** * File types/names for the generated OpenCCG-format grammar files. * @author Scott Martin * @version $Revision: 1.1 $ */ enum Type { /** * The lexicon file. */ LEXICON, /** * The file containing morphological information. */ MORPH, /** * The file where the grammar rules are stored. */ RULES; /** * Gets a filename corresponding to a given file type. * @return The file type's name, lowercased, with the string * ".xml" appended. Example: for LEXICON, * returns the string lexicon.xml. */ String fileName() { StringBuilder sb = new StringBuilder(name().toLowerCase()); sb.append(".xml"); return sb.toString(); } } Type type = null; /** * Creates a new xsltProcessors object (no-arg constructor required by Ant). */ public CCGBankTaskTemplates() { super(new ArrayList()); } /** * Adds a file list to the list of transforms. * @param fileList The FileList object to add. */ public void addConfiguredFilelist(FileList fileList) { addGroup(fileList); } /** * Gets the list of files contained in group as an array. * The order of files in the returned array is the same as the order * of group's {@link FileList#getFiles(Project) files}. */ @Override protected File[] getFiles(FileList group) { Project proj = getProject(); return makeFiles(group.getDir(proj), group.getFiles(proj)); } /** * Sets the {@link CCGBankTaskTemplates#type file type}. * @param typeName The name of the type to set. 
The actual type is * coerced using {@link Enum#valueOf(Class, String)} using * typeName as an argument. */ public void setType(String typeName) { this.type = Type.valueOf(typeName.toUpperCase()); } } ================================================ FILE: src/opennlp/ccgbank/CCGBankTaskTestbed.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// /* * $Id: CCGBankTaskTestbed.java,v 1.3 2010/12/09 04:58:12 mwhite14850 Exp $ */ package opennlp.ccgbank; import java.io.File; import org.apache.tools.ant.Task; /** * @author Scott Martin * @version $Revision: 1.3 $ * */ public class CCGBankTaskTestbed extends Task { boolean debugDerivations = false, showSem = false; File text, factors, combos, preds, treeAuxFile; /** * @return the combos */ public File getCombos() { return combos; } /** * @return the debugDerivations */ public boolean isDebugDerivations() { return debugDerivations; } /** * @return the showSem */ public boolean isShowsSem() { return showSem; } /** * @return the factors */ public File getFactors() { return factors; } /** * @return the preds */ public File getPreds() { return preds; } /** * @return the text */ public File getText() { return text; } //Get the file which stores info about the id info of treenodes public File getTree() { return treeAuxFile; } /** * @param combos the combos to set */ public void setCombos(File combos) { this.combos = combos; } /** * @param debugDerivations the debugDerivations to set */ public void setDebugDerivations(boolean debugDerivations) { this.debugDerivations = debugDerivations; } /** * @param showSem the showSem to set */ public void setShowSem(boolean showSem) { this.showSem = showSem; } /** * @param factors the factors to set */ public void setFactors(File factors) { this.factors = factors; } /** * @param preds the preds to set */ public void setPreds(File preds) { this.preds = preds; } /** * @param text the text to set */ public void setText(File text) { this.text = text; } public void setTree(File treeAuxFile) { this.treeAuxFile = treeAuxFile; } } ================================================ FILE: src/opennlp/ccgbank/InputSourceAdapter.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your 
option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// /* * $Id: InputSourceAdapter.java,v 1.1 2009/11/09 19:21:50 mwhite14850 Exp $ * Copyright (C) 2009 Scott Martin (http://www.coffeeblack.org/contact/) */ package opennlp.ccgbank; import java.io.File; import java.io.InputStream; import java.io.Reader; import javax.xml.transform.Source; import javax.xml.transform.stream.StreamSource; import org.xml.sax.InputSource; /** * Turns an {@link InputSource} into a {@link StreamSource}. This class wraps * an input source for XSLT transformation routines that expect {@link Source} * objects. * @author Scott Martin * @version $Revision: 1.1 $ */ class InputSourceAdapter extends StreamSource { InputSource inputSource; InputSourceAdapter(InputSource inputSource) { this.inputSource = inputSource; } /** * @return * @see org.xml.sax.InputSource#getPublicId() */ @Override public String getPublicId() { return inputSource.getPublicId(); } /** * @return * @see org.xml.sax.InputSource#getSystemId() */ @Override public String getSystemId() { return inputSource.getSystemId(); } /** * @param publicId * @see org.xml.sax.InputSource#setPublicId(java.lang.String) */ @Override public void setPublicId(String publicId) { inputSource.setPublicId(publicId); } /** * @param systemId * @see org.xml.sax.InputSource#setSystemId(java.lang.String) */ @Override public void setSystemId(String systemId) { inputSource.setSystemId(systemId); } /* (non-Javadoc) * @see javax.xml.transform.stream.StreamSource#getInputStream() */ @Override public InputStream getInputStream() { return inputSource.getByteStream(); } /* (non-Javadoc) * @see javax.xml.transform.stream.StreamSource#getReader() */ @Override public Reader getReader() { return inputSource.getCharacterStream(); } /* (non-Javadoc) * @see javax.xml.transform.stream.StreamSource#setInputStream(java.io.InputStream) */ @Override public void setInputStream(InputStream inputStream) { inputSource.setByteStream(inputStream); } /* (non-Javadoc) * @see javax.xml.transform.stream.StreamSource#setReader(java.io.Reader) */ @Override public void setReader(Reader reader) { inputSource.setCharacterStream(reader); } /* (non-Javadoc) * @see javax.xml.transform.stream.StreamSource#setSystemId(java.io.File) */ @Override public void setSystemId(File f) { super.setSystemId(f); inputSource.setSystemId(super.getSystemId()); } } ================================================ FILE: src/opennlp/ccgbank/TemplatesProcessor.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. 
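// InputSourceAdapter above simply re-exposes a SAX InputSource through the
// StreamSource interface so that JAXP transformers can consume it. A minimal
// identity-transform round trip; the file name input.xml is an illustrative
// assumption, and the demo sits in the same package because the adapter class
// is package-private.
package opennlp.ccgbank;

import java.io.File;
import java.io.FileInputStream;
import javax.xml.transform.Transformer;
import javax.xml.transform.TransformerFactory;
import javax.xml.transform.stream.StreamResult;
import org.xml.sax.InputSource;

public class AdapterDemo {
    public static void main(String[] args) throws Exception {
        InputSource in = new InputSource(new FileInputStream(new File("input.xml")));
        // wrap the SAX InputSource so it can be handed to anything expecting a Source
        InputSourceAdapter source = new InputSourceAdapter(in);
        Transformer identity = TransformerFactory.newInstance().newTransformer();
        identity.transform(source, new StreamResult(System.out)); // echoes the document
    }
}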
// // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// /* * $Id: TemplatesProcessor.java,v 1.2 2010/09/04 16:24:36 mwhite14850 Exp $ * Copyright (C) 2009 Scott Martin (http://www.coffeeblack.org/contact/) */ package opennlp.ccgbank; import java.io.BufferedOutputStream; import java.io.ByteArrayInputStream; import java.io.ByteArrayOutputStream; import java.io.IOException; import java.io.InputStream; import java.util.ArrayList; import java.util.Iterator; import java.util.List; import javax.xml.transform.ErrorListener; import javax.xml.transform.Result; import javax.xml.transform.Source; import javax.xml.transform.Templates; import javax.xml.transform.Transformer; import javax.xml.transform.TransformerException; import javax.xml.transform.stream.StreamResult; import javax.xml.transform.stream.StreamSource; import org.xml.sax.InputSource; import org.xml.sax.SAXException; /** * Implements an XSLT processor using {@link Templates}. This class processes * XSLT template objects successively with a given input, writing the output * of each successive transformation into memory, then feeding that output to * the next template in the chain. * @author Scott Martin * @version $Revision: 1.2 $ */ class TemplatesProcessor extends XSLTProcessor { List templates = null; TemplatesProcessor(ErrorListener errorListener) { super(errorListener); } void addTemplates(Templates t) { if(templates == null) { templates = new ArrayList(); } templates.add(t); } /* (non-Javadoc) * @see opennlp.ccgbank.XSLTProcessor#process(java.io.File) */ @Override void process(InputSource inputSource) throws IOException,SAXException, TransformerException { if(templates == null) { templates = makeTemplates(taskTemplatesList); } StreamSource input = new InputSourceAdapter(inputSource); ByteArrayOutputStream buffer = new ByteArrayOutputStream(); byte[] bytesIn = null; try { // transform input with each template successively, // writing the output of each to a memory buffer Iterator i = templates.iterator(); Source source; StreamSource memorySource = null; while(i.hasNext()) { if(bytesIn == null) { // first pass? source = input; // use source } else { // use buffer otherwise InputStream in = new ByteArrayInputStream(bytesIn); if(memorySource == null) { memorySource = new StreamSource(in); } else { memorySource.setInputStream(in); } source = memorySource; } // get and configure transformer for this template Templates template = i.next(); Transformer transformer = template.newTransformer(); transformer.setOutputProperties(xmlProperties); transformer.setErrorListener(errorListener); boolean ihn = i.hasNext(); // reuse Result result = ihn // last template? ? 
new StreamResult(buffer) // if it's the last, write output to file : new StreamResult(new BufferedOutputStream( serializer.getOutputStream())); transformer.transform(source, result); if(ihn) { bytesIn = buffer.toByteArray(); buffer.reset(); } } } finally { bytesIn = null; try { buffer.close(); } catch(IOException e) { // do nothing } } } } ================================================ FILE: src/opennlp/ccgbank/XMLFilterProcessor.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// /* * $Id: XMLFilterProcessor.java,v 1.4 2010/09/05 15:54:43 mwhite14850 Exp $ * Copyright (C) 2009 Scott Martin (http://www.coffeeblack.org/contact/) */ package opennlp.ccgbank; import java.io.FileNotFoundException; import java.io.IOException; import java.util.*; import javax.xml.transform.ErrorListener; import javax.xml.transform.Templates; import javax.xml.transform.TransformerConfigurationException; import javax.xml.transform.TransformerException; import javax.xml.transform.sax.SAXTransformerFactory; import org.apache.tools.ant.BuildException; import org.xml.sax.ErrorHandler; import org.xml.sax.InputSource; import org.xml.sax.SAXException; import org.xml.sax.XMLFilter; import org.xml.sax.helpers.XMLReaderFactory; /** * An implementation of {@link XSLTProcessor} that performs transformations * using an {@link XMLFilter}. This particular implementation uses the XSLTC * compiler distributed with Apache's Xalan in order to avoid the known * problems with re-using {@link XMLFilter}. 
* @see Apache Xalan * @author Scott Martin * @version $Revision: 1.4 $ */ class XMLFilterProcessor extends XSLTProcessor { // nb: this could be in the super class List templates = null; XMLFilter filter; ErrorHandler errorHandler; static final String XSLT_KEY = "javax.xml.transform.TransformerFactory", XSLTC_VALUE = "org.apache.xalan.xsltc.trax.TransformerFactoryImpl"; XMLFilterProcessor(ErrorListener errorListener, ErrorHandler errorHandler) { super(errorListener); this.errorHandler = errorHandler; } SAXTransformerFactory newTransformerFactory() { // TODO try using xsltc (seems to yield hard-to-trace bugs at the moment) //System.setProperty(XSLT_KEY, XSLTC_VALUE); return super.newTransformerFactory(); } /* (non-Javadoc) * @see opennlp.ccgbank.XSLTProcessor#process(java.io.File) */ @Override void process(InputSource inputSource) throws IOException,SAXException, TransformerException { // TODO figure out how to re-use filter without breaking :( // make new filter each time filter = makeFilter(taskTemplatesList); filter.setContentHandler(serializer.asContentHandler()); filter.parse(inputSource); } /** * Makes a filter from a single xsltProcessors object. * @see #makeFilter(List) */ XMLFilter makeFilter(CCGBankTaskTemplates templates) throws FileNotFoundException,SAXException, TransformerConfigurationException { return makeFilter(Collections.singletonList(templates)); } /** * Makes a filter from a series of xsltProcessors that applies those * templates in order. * @param templateList The series of xsltProcessors used to construct the * filter. * @throws BuildException If no xsltProcessors are specified. */ XMLFilter makeFilter(List templateList) throws FileNotFoundException,SAXException, TransformerConfigurationException { // make templates if(templates == null) { templates = makeTemplates(taskTemplatesList); } // assemble list of xslt templates into a filter XMLFilter currentFilter = null, previousFilter = null; for (Templates t : templates) { currentFilter = transformerFactory.newXMLFilter(t); currentFilter.setErrorHandler(errorHandler); if(previousFilter == null) { // it's the first one currentFilter.setParent( XMLReaderFactory.createXMLReader()); } else { currentFilter.setParent(previousFilter); } previousFilter = currentFilter; } if(currentFilter == null ) { throw new IllegalArgumentException("no templates specified"); } currentFilter.setErrorHandler(errorHandler); currentFilter.setFeature("http://xml.org/sax/features/namespace-prefixes", true); return currentFilter; } } ================================================ FILE: src/opennlp/ccgbank/XSLTProcessor.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. 
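// TemplatesProcessor and XMLFilterProcessor implement the same pipeline two ways:
// the former applies each stylesheet in turn, buffering intermediate output in
// memory, while the latter links one SAX XMLFilter per stylesheet via setParent,
// as in makeFilter above. A stripped-down sketch of that filter-chain idea using
// plain JAXP; the stylesheet names first.xsl/second.xsl, the input in.xml, and the
// use of an identity Transformer to drive the chain (instead of the serializer
// ContentHandler used above) are illustrative assumptions.
import java.io.File;
import javax.xml.transform.Transformer;
import javax.xml.transform.TransformerFactory;
import javax.xml.transform.sax.SAXSource;
import javax.xml.transform.sax.SAXTransformerFactory;
import javax.xml.transform.stream.StreamResult;
import javax.xml.transform.stream.StreamSource;
import org.xml.sax.InputSource;
import org.xml.sax.XMLFilter;
import org.xml.sax.helpers.XMLReaderFactory;

public class FilterChainSketch {
    public static void main(String[] args) throws Exception {
        SAXTransformerFactory stf =
                (SAXTransformerFactory) TransformerFactory.newInstance();
        // one filter per stylesheet; each filter receives SAX events from its parent
        XMLFilter first = stf.newXMLFilter(new StreamSource(new File("first.xsl")));
        first.setParent(XMLReaderFactory.createXMLReader());  // raw XML parser at the head
        XMLFilter second = stf.newXMLFilter(new StreamSource(new File("second.xsl")));
        second.setParent(first);                               // chain: parse -> first -> second
        // run the chain by transforming a SAXSource whose reader is the last filter
        Transformer runner = stf.newTransformer();             // identity transform
        runner.transform(new SAXSource(second, new InputSource("in.xml")),
                new StreamResult(System.out));
    }
}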
// // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// /* * $Id: XSLTProcessor.java,v 1.4 2010/09/05 15:54:43 mwhite14850 Exp $ * Copyright (C) 2009 Scott Martin (http://www.coffeeblack.org/contact/) */ package opennlp.ccgbank; import java.io.BufferedInputStream; import java.io.BufferedOutputStream; import java.io.File; import java.io.FileInputStream; import java.io.FileNotFoundException; import java.io.FileOutputStream; import java.io.IOException; import java.util.ArrayList; import java.util.Collections; import java.util.List; import java.util.Properties; import javax.xml.transform.ErrorListener; import javax.xml.transform.OutputKeys; import javax.xml.transform.Templates; import javax.xml.transform.TransformerConfigurationException; import javax.xml.transform.TransformerException; import javax.xml.transform.TransformerFactory; import javax.xml.transform.sax.SAXResult; import javax.xml.transform.sax.SAXSource; import javax.xml.transform.sax.SAXTransformerFactory; import javax.xml.transform.stream.StreamSource; import org.apache.tools.ant.BuildException; import org.apache.xml.serializer.OutputPropertiesFactory; import org.apache.xml.serializer.Serializer; import org.apache.xml.serializer.SerializerFactory; import org.xml.sax.InputSource; import org.xml.sax.SAXException; /** * Abstract base class for XSLT processing. Templates are added to a processor, * then {@link #process(InputSource)} is called for each input source. * Subclasses will implement different processing strategies for transforming * XML using a series of XSL templates. * @author Scott Martin * @version $Revision: 1.4 $ */ abstract class XSLTProcessor { SAXTransformerFactory transformerFactory = newTransformerFactory(); static final Properties xmlProperties = OutputPropertiesFactory.getDefaultMethodProperties("xml"); static { xmlProperties.setProperty(OutputKeys.INDENT, "yes"); xmlProperties.setProperty( "{http://xml.apache.org/xalan}indent-amount", "2"); } List taskTemplatesList = new ArrayList(); Serializer serializer = SerializerFactory.getSerializer( XSLTProcessor.xmlProperties); ErrorListener errorListener; XSLTProcessor(ErrorListener errorListener) { this.errorListener = errorListener; transformerFactory.setErrorListener(errorListener); } boolean addAllTemplates(List templateList) { boolean b = false; for(CCGBankTaskTemplates t : templateList) { b |= addTemplates(t); } return b; } boolean addTemplates(CCGBankTaskTemplates taskTemplates) { return taskTemplatesList.add(taskTemplates); } /** * Processes an input source, applying each of the templates specified * using {@link #addTemplates(CCGBankTaskTemplates)} or * {@link #addAllTemplates(List)}. Subclasses will actually implement this * method. * @param inputSource The input source to which the templates will be * applied. * @throws IOException If a problem reading or writing occurs. * @throws SAXException If a subclass uses a SAX processor and there is a * problem with it. * @throws TransformerException If a subclass uses a processor that causes * a transformer problem. 
*/ abstract void process(InputSource inputSource) throws IOException,SAXException,TransformerException; void setTarget(File file) throws FileNotFoundException { serializer.setOutputStream( new BufferedOutputStream(new FileOutputStream(file))); // ensure output properties set (shouldn't really be nec!) serializer.setOutputFormat(xmlProperties); } /** * Resets the serializer, if resetting is possible. If not, re-creates the * serializer. */ void resetSerializer() { if(!serializer.reset()) { serializer // create new unless re-useable = SerializerFactory.getSerializer(xmlProperties); } } SAXTransformerFactory newTransformerFactory() { SAXTransformerFactory tf = (SAXTransformerFactory)TransformerFactory.newInstance(); if(!tf.getFeature(SAXSource.FEATURE)) { throw new IllegalStateException( "SAX transformer factory does not support SAXSource"); } if(!tf.getFeature(SAXResult.FEATURE)) { throw new IllegalStateException( "SAX transformer factory does not support SAXResult"); } return tf; } /** * Makes a list of templates from a single xsltProcessors object. * @see #makeTemplates(List) */ List makeTemplates(CCGBankTaskTemplates taskTemplates) throws FileNotFoundException,TransformerConfigurationException { return makeTemplates(Collections.singletonList(taskTemplates)); } /** * Makes a list of templates from a series of xsltProcessors that applies those xsltProcessors * in order. * @param templateList The series of xsltProcessors used to construct the * filter. * @throws BuildException If no xsltProcessors are specified. */ List makeTemplates(List templateList) throws FileNotFoundException,TransformerConfigurationException { List l = new ArrayList(); for(CCGBankTaskTemplates taskTemplates : templateList) { for(File f : taskTemplates) { StreamSource ss = new StreamSource( new BufferedInputStream(new FileInputStream(f))); ss.setSystemId(f); l.add(transformerFactory.newTemplates(ss)); } } return Collections.unmodifiableList(l); } } ================================================ FILE: src/opennlp/ccgbank/ccgbank.properties ================================================ ccgbanktask=opennlp.ccgbank.CCGBankTask sources=opennlp.ccgbank.CCGBankTaskSources templates=opennlp.ccgbank.CCGBankTaskTemplates convert=opennlp.ccgbank.CCGBankConvert extract=opennlp.ccgbank.CCGBankExtract testbed=opennlp.ccgbank.CCGBankTaskTestbed ================================================ FILE: src/opennlp/ccgbank/convert/ApposTally.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
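// The abstract XSLTProcessor is driven from CCGBankTask.execute(): templates are
// registered once, a target file is set, and process() is then called per input
// file. A condensed sketch of that lifecycle; the anonymous ErrorListener, the
// empty CCGBankTaskTemplates (in Ant it would be populated from a <filelist>),
// and the file paths are illustrative assumptions.
package opennlp.ccgbank;

import java.io.BufferedInputStream;
import java.io.File;
import java.io.FileInputStream;
import javax.xml.transform.ErrorListener;
import javax.xml.transform.TransformerException;
import org.xml.sax.InputSource;

public class ProcessorLifecycleSketch {
    public static void main(String[] args) throws Exception {
        // stand-in for the Ant task, which itself implements ErrorListener
        ErrorListener listener = new ErrorListener() {
            public void warning(TransformerException e) { System.err.println(e.getMessage()); }
            public void error(TransformerException e) { System.err.println(e.getMessage()); }
            public void fatalError(TransformerException e) throws TransformerException { throw e; }
        };
        XSLTProcessor proc = new TemplatesProcessor(listener);
        CCGBankTaskTemplates stylesheets = new CCGBankTaskTemplates();
        proc.addTemplates(stylesheets);               // register the stylesheet chain
        proc.setTarget(new File("out/lexicon.xml"));  // where the serializer writes
        File input = new File("converted/wsj_0001.xml");
        proc.process(new InputSource(new BufferedInputStream(new FileInputStream(input))));
    }
}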
////////////////////////////////////////////////////////////////////////////// //Class which stores info about punctuations package opennlp.ccgbank.convert; import java.io.BufferedReader; import java.io.FileReader; import java.io.IOException; import java.util.ArrayList; public class ApposTally { //Operation performed //private String oper = ""; //Dest dir //private String destDir = ""; //Sentence id private String id = ""; //Context of a comma //private String cont = ""; //Status whether comma is balanced or not private String balStatus = ""; //Intervening lexical mtl private String lexMtl = ""; //Cue analysis result //private String cueResult = ""; //Features for appos vs conj identification private ArrayList featInfo = new ArrayList(); //Heads of np private ArrayList headInfo1 = new ArrayList(); //Heads of appositive private ArrayList headInfo2 = new ArrayList(); //Cues private static ArrayList cueList = new ArrayList(); //Proc which opens the cue file public void openCueFile(String fileName) throws IOException { BufferedReader br = new BufferedReader(new FileReader(fileName)); String line = ""; while ((line = br.readLine()) != null) { if (!cueList.contains(line)) cueList.add(line); //System.out.println(line); } br.close(); } //Proc which traps, stores id of each sentence in a global var public String storeId(String x) { id = ""; id = x; //System.out.println(id); return null; } //Proc which reinitializes all vars when a new comma is encountered public void flushVars() { balStatus = "conj"; lexMtl = ""; headInfo1.clear(); headInfo2.clear(); //cueResult = ""; featInfo.clear(); } //Proc which stores whether comma is balanced public void storeBalance(String status) { balStatus = status; } //Proc which returns balance status public String getBalance() { return balStatus; } //Proc which returns capitalized string of balance status public String getCaps(String x) { return x.toUpperCase(); } //Proc which stores intervening lexical mtl public void storeLex(String word, String pos) { String info = ""; if (pos.equals("X")) info = word; else info = word + "/" + pos; lexMtl = lexMtl + " " + info; } //Proc which prints intervening lexical mtl public void printLex() { lexMtl = id + " " + lexMtl; //System.out.println(lexMtl+'\n'); lexMtl = ""; } //Proc which stores head of np1 public void storeHead(String word, String pos, int npNo) { String info = ""; //Eliding the distinction b/w sing&plural nouns if (pos.equals("NNS")) pos = "NN"; if (pos.equals("NNPS")) pos = "NNP"; info = word + "/" + pos; if (npNo == 1) headInfo1.add(info); else headInfo2.add(info); } //Heuristic2: Cue based analysis public String cueAnalysis() { //String[] np = lexMtl.split("X"); String[] sent = lexMtl.split("X"); //Sift out possessed in genitive constr if (sent[0].contains("'s/POS") && headInfo1.size() > 0) headInfo1.remove(0); if (sent[1].contains("'s/POS") && headInfo2.size() > 0) headInfo2.remove(0); String res = ""; int flag = 0; String np1head[] = new String[2]; if (headInfo1.size() == 0 || headInfo2.size() == 0) { //System.out.println(id+": "+lexMtl+'\n'); headInfo1.add("X1/ECK"); np1head = (headInfo1.get(headInfo1.size() - 1)).split("/"); } else np1head = (headInfo1.get(headInfo1.size() - 1)).split("/"); //Comparing the heads of np1 & np2 for (String x : headInfo2) { String[] np2head = x.split("/"); if (np2head[1].equals(np1head[1])) flag = 1; else { flag = 0; break; } } //Avoid place names: ie like c if (flag == 1 && headInfo1.size() == 1 && headInfo2.size() == 1) flag = 0; if (flag == 1 && sent[0].contains("/CC") && 
!sent[0].contains(",")) flag = 0; //Like nps together smacks of a conjunction if (flag == 0 && sent[1].contains("/CC")) { headInfo2.add("X2/ECK"); String np2head[] = (headInfo2.get(0)).split("/"); if (np2head[1].equals(np1head[1])) flag = 1; } //if(flag==0 && sent[1].contains(",/, and/CC"))flag=1; /*Stub to print a particular sentence if(id.equals("ID=wsj_0012.3")){ System.out.println("Flag: "+flag); System.out.println(headInfo1); System.out.println(headInfo2); }*/ if (flag == 1) res = "conj"; else res = "appos"; //if(unit.contains("/CD") || unit.contains("/POS") || unit.contains("/IN") || unit.contains("/DT")|| unit.contains("PRP$") || head1==true || cue==true)featInfo.add("appos"); return res; } } ================================================ FILE: src/opennlp/ccgbank/convert/DiscrCheck.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// //Class which stores the context of punctuations package opennlp.ccgbank.convert; public class DiscrCheck{ //Sentence id private String id=""; //Proc which traps, stores id of each sentence in a global var public String storeId(String x){ id=""; id=x; return null; } public void checkCatDiscr(String cat,String cat0,String lex){ //Comparing discrepancies between cat0 & cat1 //Just a check. Should be commented out in the final version String catA=cat0; String catB=cat; catA=catA.toLowerCase(); catB=catB.replaceAll("[0-9]",""); catB=catB.replaceAll("_",""); if(!catA.equals(catB) && !cat0.contains("nb")) System.out.println(id+": "+cat0+"***"+cat+" - "+lex); } } ================================================ FILE: src/opennlp/ccgbank/convert/GenChal11Adjuster.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2011 Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccgbank.convert; import java.util.*; /** * Utility class for adjusting Generation Challenges 2011 outputs. * Strings are lowercased, named entities and hyphenated words are split, * and dollar sign and numbers are transposed. */ public class GenChal11Adjuster { /** Returns the adjusted text string . */ public String getAdjustedString(String text) { // lowercase and split String[] tokens = text.toLowerCase().split("\\s+"); // swap dollar signs for (int i=0; i < tokens.length-1; i++) { if (tokens[i+1].equals("$")) { try { // check for preceding number token Double.parseDouble(tokens[i]); // swap, skip String num = tokens[i]; tokens[i] = tokens[i+1]; tokens[i+1] = num; i++; } catch (NumberFormatException e) {} } } // split NEs and hyphenated words List splitTokens = new ArrayList(tokens.length*2); for (String token : tokens) { String[] tokenSplits = token.replace("-"," - ").split("[_ ]"); for (String s : tokenSplits) splitTokens.add(s); } // join StringBuffer retval = new StringBuffer(); for (int i=0; i < splitTokens.size()-1; i++) { retval.append(splitTokens.get(i)); retval.append(' '); } retval.append(splitTokens.get(splitTokens.size()-1)); // done return retval.toString(); } } ================================================ FILE: src/opennlp/ccgbank/convert/GenConjRule.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// //Java class which adds brackets, stores arg1 position for inferConjRules.xsl,normConjRulesId, normTreenodeId.xsl package opennlp.ccgbank.convert; import java.util.ArrayList; import java.util.Hashtable; //import java.util.StringTokenizer; public class GenConjRule { //The largest current id private static int globalId = 0; //The store of ids private static Hashtable idTally = new Hashtable(); //Dollar status of res, arg1 & arg2 private static ArrayList dollarStatus = new ArrayList(); //Final result of dollar status calcs private static String ds = "No_Dollar"; //Add brackets to complex categories public String addParen(String str) { if (str.contains("\\") || str.contains("/")) str = "(" + str + ")"; return str; } //Add _conj to the result category public String modRes(String str) { //StringTokenizer st = new StringTokenizer(str, "[]"); str = str + "_conj"; return str; } //Procedure which cleans the unary rule result public String getConjRes(String x) { x = x.replaceAll("_conj", ""); x = x.replaceAll("_[0-9]", ""); //System.out.println(x); return x; } //Normalizes id of input category public String normId(String oldId, String oldInhId, String cat) { String newId = ""; //int choice = 0; //Switch for usage between Treenode & Leafnode Id normalization if (oldId.length() > 0) cat = cat + "_" + oldId; if (oldInhId.length() > 0) cat = cat + "_" + oldInhId; cat = cat.trim(); //Normalization condition if (!idTally.containsKey(cat)) { globalId++; newId = Integer.toString(globalId); idTally.put(cat, newId); } newId = (String) idTally.get(cat); return newId; } //Initialization of idTally & globalId before start of a new conj rule public String globalInit() { globalId = 0; idTally.clear(); return null; } //Initialization of idTally before each of Result,arg1 & arg2 is added public String localInit() { idTally.clear(); return null; } //Calculation of dollarStatus before start of a new conj rule //Initialization of dollarStatus before start of a new conj rule public String dsInit() { //System.out.println(dollarStatus); dollarStatus.clear(); ds = "No_Dollar"; return null; } //Store dollar status of res, arg1 & arg2 public String storeDollarStatus(String type) { type = type.trim(); dollarStatus.add(type); /*System.out.println('\n'); System.out.println("Insertion of: "+type); System.out.println(dollarStatus); System.out.println('\n');*/ return "null"; } public String dsCalc() { //System.out.println(dollarStatus); if (dollarStatus.size() == 3) ds = "Dollar"; /*System.out.println('\n'); System.out.println("Retrieval"); System.out.println(dollarStatus); System.out.println('\n');*/ return null; } //Get dollar status of conjunct public String getDollarStatus() { return ds; } //Function invoked by invertedDirSpComma.xsl public String getglobalId() { globalId++; return Integer.toString(globalId); } } ================================================ FILE: src/opennlp/ccgbank/convert/InfoHelper.java ================================================ /////////////////////////////////////////////////////////////////////////////// //Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // //This library is free software; you can redistribute it and/or //modify it under the terms of the GNU Lesser General Public //License as published by the Free Software Foundation; either //version 2.1 of the License, or (at your option) any later version. 
// //This library is distributed in the hope that it will be useful, //but WITHOUT ANY WARRANTY; without even the implied warranty of //MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the //GNU Lesser General Public License for more details. // //You should have received a copy of the GNU Lesser General Public //License along with this program; if not, write to the Free Software //Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// //Java class which helps info extr from PTB package opennlp.ccgbank.convert; //import opennlp.ccg.lexicon.*; import java.util.*; import java.io.*; public class InfoHelper{ /** CCG terminal & non-terminal nos.. */ private int termNo=0;private int ntNo=500; /** BBN-info. */ private static Hashtable bbnInfo=new Hashtable(); private static Hashtable> bbnSpans=new Hashtable>(); private static ArrayListbbnClasses=new ArrayList(); /** Quote info. */ private static Hashtable quoteInfo=new Hashtable(); /** PTB aux info viz. SBJ, FN_Tag & TPC annotation **/ private static Hashtable sbjInfo=new Hashtable(); private static Hashtable fntagInfo=new Hashtable(); private static Hashtable tpcInfo=new Hashtable(); /** Treenode info. */ private static Hashtable treeInfo=new Hashtable(); /** Directory where aux file and BBN NE info is stored. */ static File auxFileDirectory = null, bbnAuxDirectory = null; /** Store aux file directories. */ public static void init(File auxDir, File bbnAuxDir) { InfoHelper.auxFileDirectory = auxDir; InfoHelper.bbnAuxDirectory = bbnAuxDir; } /** Read BBN NE aux file corresponding to the WSJ Section provided as argument. */ public static void readBBNAuxfiles(String sect){ String bbnAuxFile=bbnAuxDirectory+"/"+"bbn-ccg"+sect+".aux"; try{ if(new File(bbnAuxFile).exists()){ BufferedReader inp= new BufferedReader(new FileReader(bbnAuxFile)); System.out.println("Reading in BBN aux file: "+bbnAuxFile); String line=""; while((line=inp.readLine())!=null ){ if(line.length()==0)continue; String bbn[]=line.trim().split(" "); String sentId=bbn[0]; String span=bbn[1]+","+bbn[2]; String key=sentId+" "+span; String bbnData=""; for(int i=3;i spanList=new ArrayList(); if(!bbnSpans.containsKey(sentId)) bbnSpans.put(sentId,spanList); spanList=bbnSpans.get(sentId); spanList.add(span); bbnSpans.put(sentId,spanList); } inp.close(); } } catch(IOException e){ System.out.println("Error reading: "+bbnAuxFile); } } /** Read quotes aux file corresponding to the WSJ Section provided as argument. */ public static void readQuoteAuxfiles(String sect){ String quoteAuxFile=auxFileDirectory+"/"+"aux-quotes-"+sect+".txt"; try{ if(new File(quoteAuxFile).exists()){ System.out.println("Reading in quotes aux File: "+quoteAuxFile); String line=""; BufferedReader inp= new BufferedReader(new FileReader(quoteAuxFile)); while((line=inp.readLine())!=null ){ if(line.length()==0)continue; String quoteData[]=line.trim().split(" "); String sentId=quoteData[0]; String span=quoteData[1]+","+quoteData[2]; String key=sentId+" "+span; String quotedText=""; for(int i=3;i treeCont=new ArrayList(); public boolean checkTreeInfo(String header,String ntId,int numCats){ String key=header+" "+ntId; if(treeInfo.containsKey(key)){ String treeCats=treeInfo.get(key); String[] x=treeCats.split(","); if(numCats==x.length) return true; else return false; } else return false; } /** Retrieve treenode info. 
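 * A hypothetical usage sketch; the "header ntId" key format is taken from
 * checkTreeInfo above, and the concrete id values are illustrative only:
 * <pre>
 *   InfoHelper helper = new InfoHelper();
 *   // comma-separated cat ids for this treenode, or "" if the key is unknown;
 *   // also primes the internal list later read back by getTreeId() and getTreeSlash()
 *   String treeCats = helper.getTreeInfo("ID=wsj_0001.1 501");
 * </pre>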
*/ public String getTreeInfo(String key){ String retVal=""; treeCont=new ArrayList(); if(treeInfo.containsKey(key)){ retVal=treeInfo.get(key); String[]temp=retVal.split(","); for(String x:temp) treeCont.add(x); } return retVal; } /** Procedure which gives back id of a particular cat. */ public String getTreeId(){ String retVal=""; if(treeCont.size()>0){ retVal=treeCont.get(0); treeCont.remove(0); String x[]=retVal.split("_"); retVal=x[1]; if(x.length==3) retVal="M_"+retVal; } return retVal; } /** Procedure which gives slash of combination. */ public String getTreeSlash(){ String retVal=""; if(treeCont.size()>0){ String slash=treeCont.get(0); String mode=""; if(slash.length()>1) mode=Character.toString(slash.charAt(1)); else if(slash.startsWith("/")) mode=">"; else if(slash.startsWith("\\")) mode="<"; treeCont.remove(0); retVal=Character.toString(slash.charAt(0)); retVal=retVal+"_"+mode; } return retVal; } /** Retrieve BBN class for lexical items for use in the Leafnodes. */ public String getBBNClass(String header,String lex,String pos,String cat,int nodeInd){ String retVal=""; String semClass=""; //Check and exit if the pos is not relevant boolean relFlag=false; if(cat.matches("pp\\[[a-z]+\\]_~2/np_2")) return ""; if (pos.startsWith("NN") || pos.startsWith("RB") || pos.startsWith("JJ") || pos.startsWith("VB") ||pos.equals("CD") || lex.equals("%") || pos.equals("$")) relFlag=true; if(!relFlag) return ""; String sentId=header.replaceFirst("ID=",""); ArrayList spanList=new ArrayList(); String key=sentId+" "+Integer.toString(nodeInd)+","+Integer.toString(nodeInd); if(bbnInfo.containsKey(key)){ String bbnData=bbnInfo.get(key); String info[]=bbnData.split(" "); if(info.length>=2){ semClass=getCleanClass(info[0]); retVal=(classReplace(semClass,lex,info[1])).trim(); if(retVal.length()>0 && !bbnClasses.contains(retVal)) bbnClasses.add(retVal); } return retVal; } else if(bbnSpans.containsKey(sentId)) spanList=bbnSpans.get(sentId); for(String span: spanList){ String inds[]=span.split(","); if(inds.length!=2)continue; if(!inds[0].matches("[0-9]+") || !inds[1].matches("[0-9]+") || inds[0].equals("NA") || inds[1].equals("NA")) continue; int ind1=Integer.parseInt(inds[0]); int ind2=Integer.parseInt(inds[1]); if(nodeInd >=ind1 && nodeInd <=ind2){ key=sentId+" "+span; String bbnData=bbnInfo.get(key); String info[]=bbnData.split(" "); if(info.length==0) continue; semClass=getCleanClass(info[0]); //Compile a list of acceptable classes boolean accClasses=false; if (!semClass.startsWith("DATE") && !semClass.startsWith("TIME") && !semClass.startsWith("ORDINAL") && !semClass.startsWith("QUANTITY") && !semClass.startsWith("PERCENT") && !semClass.startsWith("MONEY")) accClasses=true; if (accClasses || pos.startsWith("NN") || pos.equals("CD") || lex.equals("%") || pos.equals("$")){ String wordBit=""; int relInd=nodeInd-ind1+1; if(relInd=0) wordBit=info[(nodeInd-ind1+1)]; retVal=classReplace(semClass,lex,wordBit); if(retVal.length()>0 && !bbnClasses.contains(retVal)) bbnClasses.add(retVal); break; } } } return retVal; } /** Perform semantic replacement over relevant parts of the part. */ public String classReplace(String semClass,String lex,String wordBit){ String retVal=""; /*CITY-based classes if(wordBit.equals(lex)) retVal=semClass; else if(lex.contains(wordBit)) retVal=lex.replaceFirst(wordBit,semClass);*/ //Ignore CITY-based classes if(wordBit.equals(lex)) retVal=semClass; return retVal; } /** Strip off label like ENAMEX,TIMEX,NUMEX. 
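 * For example, reading the behavior off the implementation below,
 * <pre>
 *   new InfoHelper().getCleanClass("ENAMEX=PERSON")   // yields "PERSON"
 * </pre>
 * keeps only the part after the '='; an input without an '=' yields the empty string.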
*/ public String getCleanClass(String semClass){ String retVal=""; String x[]=semClass.split("="); if(x.length>=2) retVal=x[1]; return retVal; } /** Retrieve stored bbn-info for use in the Treenodes. */ public String getBBNInfo(String header,String span,String words){ String sentId=header.replaceFirst("ID=",""); String bbnData=""; String key=sentId+" "+span; boolean legitPhr=false; //Checking stored BBN-data with actual words if(bbnInfo.containsKey(key)){ String[] ccgWords=words.split("_"); bbnData=bbnInfo.get(key); String[] bbnWords=bbnData.split(" "); if(ccgWords.length>0 && bbnWords.length>1 && ccgWords.length==bbnWords.length-1){ for(int i=0;i0) retVal=span1+" "+qInfo[0]; } else if(quoteInfo.containsKey(key2)){ quotedText=quoteInfo.get(key2); String []qInfo=quotedText.split(" "); if(qInfo.length>0 && qInfo[qInfo.length-1].matches("\\p{Punct}")){ retVal=span2+" "+qInfo[0]+" "+qInfo[qInfo.length-1]; } } return retVal; } /** Store result cat. */ String res=""; public void storeRes(String str){ this.res=str.replaceAll("\\[.*",""); } /** Retrieve result cat. */ public String getRes(){ String retVal=this.res; return retVal; } /** The store of ids. */ private Hashtable idTally=new Hashtable(); public String id(String cat){ String retVal=""; int idNum=idTally.size()+2; if(!idTally.containsKey(cat)) idTally.put(cat,idNum); else idNum=idTally.get(cat); if(idTally.size()==1) retVal="first"+"_"+Integer.toString(idNum); else retVal="later"+"_"+Integer.toString(idNum); return retVal; } public void id(){ idTally=new Hashtable(); } /** Retrieve terminal no. */ public String getTermNo(){ String tn=Integer.toString(this.termNo); this.termNo++; return tn; } /** Retrieve non-terminal no. */ public String getNonTermNo(){ String ntNo=Integer.toString(this.ntNo); this.ntNo++; return ntNo; } /** Get punctless index. */ int plessInd=0; public String getPunctlessIndex(String word){ boolean isCCGWord=this.isCCGWord(word); int retval=-1; if(isCCGWord){ retval=this.plessInd; this.plessInd++; } return Integer.toString(retval); } /** Given a lexical item, ascertain whether it is a legit original CCGbank word **/ public boolean isCCGWord(String word){ boolean retval=true; if(word.matches("\\p{Punct}|[\\.]+|(-lrb-)|(-rrb-)|(-lcb-)|(-rcb-)|(--)|(`)|(')|(``)|('')") && !word.equals("$") && !word.equals("%")){ retval=false; } return retval; } /** Init terminal nos. */ public String initId(){ this.termNo=0; this.ntNo=500; this.plessInd=0; return null; } /** Extract PTB SBJ,FN-TAG & TPC annotation. */ public String getPTBInfo(String label,String sentId,String head,String lexInd){ String retval=""; sentId=sentId.replaceFirst("ID=",""); String key=sentId+" "+head+"_"+lexInd; String rel=null; if(label.equals("SBJ"))rel=sbjInfo.get(key); else if(label.equals("FNT"))rel=fntagInfo.get(key); else if(label.equals("TPC"))rel=tpcInfo.get(key); if(rel!=null){ retval=rel; } return retval; } /** Print out BBN classes (for use in grammar.xml). */ public void printBBNClasses(){ try{ System.out.println("Printing BBN classes used in the corpus to bbn-types.txt (for use in grammar.xml)"); // Create a FileWriter stream to the file FileWriter file_writer = new FileWriter ("bbn-types.txt"); BufferedWriter buf_writer = new BufferedWriter (file_writer); PrintWriter print_writer = new PrintWriter (buf_writer,true); print_writer.print(""); print_writer.flush(); } print_writer.close(); } catch (Exception e){ System.err.println ("Error writing info to file"); } } /** Input a string which contains a ':' and replace it by '|'. 
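 * For example,
 * <pre>
 *   new InfoHelper().replaceColon("s[dcl]\\np:Arg0")   // yields "s[dcl]\\np|Arg0"
 * </pre>
 * (an illustrative cat-plus-roles string; every ':' in the input is replaced).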
*/ public String replaceColon(String str) { String replacedStr=str.replace(":","|"); return replacedStr; } } ================================================ FILE: src/opennlp/ccgbank/convert/Javafns.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// //Java Program invoked by pp-head extraction routines package opennlp.ccgbank.convert; import java.util.ArrayList; import java.util.List; // NB: addRes and changeCat probably made superfluous by computeCats.xsl public class Javafns{ //Prep heads storage public List heads = new ArrayList(); //Temp id of pp heads with args String tempId=""; //Insert the prep-head into a result category by string replacement public String addRes(String cat,String ppHead){ //Xsl spl char detected and escaped if(ppHead.equals("$")) ppHead="\\$"; //Head inserted into first PP category cat=cat.replaceFirst("pp","pp["+ppHead+"]"); return cat; } //A safety hatch to elide extra heads detected - For leaf nodes public String elimRedun(int headCount){ //Calculating redundant Headcount int j=0; //All heads following the last PP-head in a cat spec are redundant int redun=heads.size()-headCount; //Redundant heads removed for(j=0;j-1;i--){ String ppHead = heads.get(i); //Escaping dollar signs for xsl if(ppHead.equals("$")) ppHead="\\$"; //Simple head insertion by replacement on the string cat=cat.replaceFirst("pp_","pp["+ppHead+"]_"); } return cat; } public String flush(){ heads.clear();tempId=""; return null; } public String setHead(String head){ heads.add(head); return null; } public String getHead(){ String head=""; if(heads.size()==0) head="WrongHead"; else{ head = heads.get(heads.size()-1); heads.remove(heads.size()-1); } return head; } public String peekHead(){ String head="WrongHead"; if(heads.size()>0) head = heads.get(heads.size()-1); return head; } public String printCat(String cat){ System.out.println(cat); return cat; } } ================================================ FILE: src/opennlp/ccgbank/convert/MWHelper.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. 
// // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// //Bkgrnd java class which helps with operations reltd to multi-word units //As a first stab, I combine multi-word conjns like "As well as" package opennlp.ccgbank.convert; import java.util.*; public class MWHelper { // The largest current id private String lex = ""; private String pos = ""; private String term_no = ""; // A list of the particle terminal nos private ArrayList prtTally = new ArrayList(); // Index of terminal nos and the lexical items they correspond to private Hashtable prtIndex = new Hashtable(); public void initSettings() { prtTally = new ArrayList(); prtIndex = new Hashtable(); } // Concat lex,pos & term_nos of multi-word units public void concatWords(String lex, String pos, String term_no) { // System.out.println(lex); this.lex = this.lex + "_" + lex; this.pos = this.pos + " " + pos; this.term_no = this.term_no + " " + term_no; } // Retrieve stored info public String getInfo(int choice) { String retVal = ""; switch (choice) { case 1: retVal = lex.trim().replaceFirst("_", ""); this.lex = ""; break; case 2: retVal = pos.trim(); this.pos = ""; break; case 3: retVal = term_no.trim(); this.term_no = ""; break; } return retVal; } // Store particle ids public void storePrt(String prt_term_no, String prt) { prtTally.add(Integer.parseInt(prt_term_no)); prtIndex.put(Integer.parseInt(prt_term_no), prt); } public String peekPrt(int nextPrnNo) { String retVal = ""; if (prtIndex.containsKey(nextPrnNo)) { retVal = prtIndex.get(nextPrnNo); } return retVal; } public String getPrt() { // System.out.println(prtTally); // prtTally=new ArrayList(); Collections.sort(prtTally); String retVal = ""; if (prtTally.size() > 0) { retVal = (prtTally.get(prtTally.size() - 1)).toString(); // System.out.println(retVal); prtTally.remove(prtTally.size() - 1); } return retVal; } } ================================================ FILE: src/opennlp/ccgbank/convert/MorphLookup.java ================================================ package opennlp.ccgbank.convert; import java.io.BufferedReader; import java.io.File; import java.io.FileReader; import java.io.IOException; import java.util.HashMap; import java.util.Map; /** * Utility class for looking up stems as determined by the morpha utility. 
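 *
 * A hypothetical usage sketch (the file names are illustrative; init expects a
 * words file with one "word POS" pair per line and a stems file with the
 * corresponding stems, read in parallel):
 * <pre>
 *   MorphLookup.init(new File("wsj-nns-vb"), new File("wsj-nns-vb-stems"));
 *   String stem = new MorphLookup().getStem("dogs", "NNS");  // "" if no stem is known
 * </pre>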
*/ public class MorphLookup { // map from word_pos to stem private static Map stemMap = null; static File words, stems; public static void init(File wordsFile, File stemsFile) throws IOException { MorphLookup.words = wordsFile; MorphLookup.stems = stemsFile; if(MorphLookup.words == null) { throw new IllegalArgumentException("words file not specified"); } if(MorphLookup.stems == null) { throw new IllegalArgumentException("stems file not specified"); } stemMap = new HashMap(); BufferedReader wordsReader = new BufferedReader( new FileReader(words)); BufferedReader stemsReader = new BufferedReader( new FileReader(stems)); String wordsLine, stemsLine; // read lines in parallel while ( (wordsLine = wordsReader.readLine()) != null ) { stemsLine = stemsReader.readLine(); //System.out.println(stemsLine); // wordsLine has a word and a POS String[] tokens = wordsLine.split("\\s+"); String word = tokens[0]; String pos = tokens[1]; // stemsLine just has a stem; lowercase it, for good measure String stem = stemsLine.trim().toLowerCase(); // add word_POS -> stem to map, also with word lowercased String key = word + "_" + pos; String key2 = word.toLowerCase() + "_" + pos; stemMap.put(key, stem); stemMap.put(key2, stem); } wordsReader.close(); stemsReader.close(); } /** Returns the stem for the given word and pos, or the empty string if none. */ public String getStem(String word, String pos) { String retval="";String key=word + "_" + pos; if (MorphLookup.stemMap.containsKey(key)) retval = stemMap.get(word + "_" + pos); /*if (retval == null) retval = ""; //System.out.println(key+" "+retval);*/ if(retval.length()==0) System.out.println("addStems: No stem for: "+key); return retval; } } ================================================ FILE: src/opennlp/ccgbank/convert/OrigPunctRules.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// //Class which stores the context of punctuations package opennlp.ccgbank.convert; import java.util.Hashtable; public class OrigPunctRules { //Sentence id private String id = ""; //The largest current id private static int globalId = 0; //ccgbank section private String sect=""; //Label for a punct mark private String label = ""; //The store of ids private static Hashtable idTally = new Hashtable(); //Proc which traps, stores id of each sentence in a global var public String storeId(String x) { id = ""; sect = ""; //System.out.println(x+" "+"Raja"); String expId[] = x.split("_"); id = expId[1]; sect = id.substring(0, 2); if (sect.length() < 0) sect += "just avoiding a warning here"; //System.out.println(sect+" "+"Raja"); return null; } //Initialization before start of a new binary rule public String initId() { globalId = 0; idTally.clear(); return null; } //Id allotment public String allotId(String cat) { String newId = ""; //Id allotment if (!idTally.containsKey(cat)) { globalId++; newId = Integer.toString(globalId); idTally.put(cat, newId); } newId = (String) idTally.get(cat); return newId; } public String storeLabel(String x) { label = x; return null; } public String getLabel() { return label; } public String initLabel() { label = ""; return null; } } ================================================ FILE: src/opennlp/ccgbank/convert/PunctHelper.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// //Java class which adds brackets, stores arg1 position for inferConjRules.xsl,normConjRulesId, normTreenodeId.xsl package opennlp.ccgbank.convert; import java.util.ArrayList; import java.util.Hashtable; public class PunctHelper { //The largest current id private int globalId = 0; //The store of ids //private Hashtable idTally = new Hashtable(); private String feat = ""; private String pos = ""; private String balCom = ""; //The pos-indexRel tally private static Hashtable> indexRel = new Hashtable>(); //Calculate & store the indexRel public String calcIndexRel(String cat, String pos) { ArrayList temp = new ArrayList(); pos = pos.replaceAll("[0-9]", ""); //System.out.println(cat); if (!pos.equals("PUNCT_LPAREN")) { cat = cat.replaceAll("/\\*punct\\[,\\]_[0-9]", ""); cat = cat.replaceAll("/\\*punct\\[--\\]_[0-9]", ""); cat = cat.replaceAll("/\\*punct\\[-rrb-\\]_[0-9]", ""); cat = cat.replaceAll("/\\*punct\\[-rcb-\\]_[0-9]", ""); } //System.out.println(cat); if (!indexRel.containsKey(pos)) { temp.add(cat); indexRel.put(pos, temp); } temp = indexRel.get(pos); if (!temp.contains(cat)) temp.add(cat); String ind = Integer.toString(temp.indexOf(cat) + 1); return ind; } //Initialization before start of a new conj rule public String globalInit() { globalId = 0; //idTally.clear(); return null; } //Function invoked by invertedDirSpComma.xsl public String getglobalId() { globalId++; return Integer.toString(globalId); } public String setglobalId(int x) { globalId = x; return null; } public String storePOS(String x) { pos = x; return null; } public String getPOS() { String retVal = pos; return retVal; } public String initPOS() { pos = ""; return null; } public String balInit() { balCom = ""; return null; } public String storeBal(String x) { balCom = x; return null; } public String getBal() { return balCom; } public String storeFeat(String x) { feat = x; return null; } public String getFeat() { return feat; } public String featInit() { feat = ""; return null; } public String debugPrint(String x, String y) { System.out.println("Debug: " + x + " at " + y); return null; } public String removeFeats(String cat) { cat = cat.replaceAll("\\[[a-zA-Z]+\\]", ""); //System.out.println("Debug: "+cat); return cat; } public String purgeCat(String cat) { cat = cat.replaceAll("\\[[a-zA-Z]+\\]", ""); cat = cat.replaceAll("~", ""); cat = cat.replaceAll("_[0-9]+", ""); //System.out.println("Debug: "+cat); return cat; } public String purgeCat1(String cat) { cat = cat.toLowerCase(); cat = cat.replaceAll("\\[[a-zA-Z]+\\]", ""); cat = cat.replaceAll("~", ""); cat = cat.replaceAll("_[0-9]+", ""); //System.out.println("Debug: "+cat); return cat; } //Replace pp[] by pp public String cleanPP(String cat) { cat = cat.replaceAll("pp\\[\\]", "pp"); return cat; } } ================================================ FILE: src/opennlp/ccgbank/convert/RoleAdjuster.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. 
// // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccgbank.convert; /** * Utility class for adjusting roles and augmenting cat names with roles. */ public class RoleAdjuster { /** Returns the adjusted argument roles, making guesses at the missing roles. */ public String getAdjustedRoles(String cat, String roles) { // aux things like "have to" if (roles.equals("null e") || roles.equals("e e")) { if (cat.indexOf("np[thr]") < 0) return "Arg0 Arg1"; else return "e Arg1"; } // vp mods if (roles.startsWith("null e")) { return "null ArgM" + roles.substring("null e".length()); } // missing subjects, mostly if (roles.startsWith("null")) { String rest = roles.substring("null".length()); return addMissingArg(cat, rest); } // various if (roles.startsWith("e")) { String rest = roles.substring("e".length()); // mods if (cat.indexOf("_~") > 0) return "ArgM" + rest; // leave expletives unchanged if (cat.indexOf("np[expl]") > 0 || cat.indexOf("np[thr]") > 0) return roles; // otherwise add standard guess return addMissingArg(cat, rest); } // otherwise unchanged return roles; } // add guess at missing arg private String addMissingArg(String cat, String rest) { // distinguish passive if (cat.startsWith("s[pss]")) { if (rest.indexOf("Arg1") < 0) return "Arg1" + rest; else return "Arg2" + rest; } // otherwise Arg0 or Arg1 if (rest.indexOf("Arg0") < 0) return "Arg0" + rest; else return "Arg1" + rest; } /** Returns the cat name augmented with the given argument roles. */ public String getCatPlusRoles(String cat, String roles) { return cat + ":" + roles.replaceAll(" ", "+"); } } ================================================ FILE: src/opennlp/ccgbank/convert/XSLTTrueCaser.java ================================================ /////////////////////////////////////////////////////////////////////////////// //Copyright (C) 2011 Dennis N. Mehay // //This library is free software; you can redistribute it and/or //modify it under the terms of the GNU Lesser General Public //License as published by the Free Software Foundation; either //version 2.1 of the License, or (at your option) any later version. // //This library is distributed in the hope that it will be useful, //but WITHOUT ANY WARRANTY; without even the implied warranty of //MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the //GNU Lesser General Public License for more details. // //You should have received a copy of the GNU Lesser General Public //License along with this program; if not, write to the Free Software //Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// package opennlp.ccgbank.convert; /** * A class that has a static constructor to create a TrueCaser so that XSLT (which requires such a * set-up) can call the TrueCaser. * * @author Dennis N. Mehay * */ import opennlp.ccg.lexicon.TrueCaser; public class XSLTTrueCaser { static TrueCaser tc = null; /** * Static constructor that creates a true-caser. 
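 * A hypothetical calling sequence (the path is illustrative; init must be
 * called before trueCase, since the true-caser is held in a static field):
 * <pre>
 *   XSLTTrueCaser.init("models/truecase-list.txt");
 *   String cased = new XSLTTrueCaser().trueCase("nasa", "ORGANIZATION", "NNP", "5");
 * </pre>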
See the TrueCaser.java doc's for more info. */ public static void init(String pathToTrueCaseList) { XSLTTrueCaser.tc = new TrueCaser(pathToTrueCaseList, 0.5); } /** Function invoked from the XSLT transform trueCaser.xsl to true case words in a derivation .*/ public String trueCase(String theWord, String neClass, String pos,String wordPosition) { return tc.trueCase(theWord, true, true); } } ================================================ FILE: src/opennlp/ccgbank/extract/CatNode.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// //Java class to store all the info associated with a category package opennlp.ccgbank.extract; import java.io.PrintWriter; import java.util.ArrayList; import java.util.HashMap; import java.util.List; import java.util.Map; import java.util.StringTokenizer; public class CatNode { // Category name, POS public final String cat; public final String pos; //Lexeme frequency private Map lexFreq = new HashMap(); //Sentence id of lexemes private Map> lexOccur = new HashMap>(); //Constructor to initialize the cat name public CatNode(String cat, String pos){ this.cat=cat; this.pos = pos; } //Procedure to insert info associated with all lexemes of a category public void lexInsert(String lex, String id){ //When first occurences of lexemes detected, entries opened if (!lexFreq.containsKey(lex)){ lexFreq.put(lex, 1); List idList = new ArrayList(4); idList.add(id); lexOccur.put(lex, idList); } else { //Subsequent occurences of lexemes updated lexFreq.put(lex, lexFreq.get(lex)+1); List idList = lexOccur.get(lex); //Ids of up to four sentences stored if(!idList.contains(id) && idList.size() < 4){ idList.add(id); } } } // returns frequence of lex with this cat and pos public int getLexFreq(String lex) { Integer retval = lexFreq.get(lex); if (retval == null) return 0; else return retval; } //Proc which prints out the lexical info of a category public void printTally(PrintWriter output) { //Lexemes sorted in descending order of freq List sortedLex = FreqTally.sortTally(lexFreq); String ccgbankHome = System.getProperty("CCGBANK_HOME", "/home/corpora/EN/ccgbank"); //Sorted list processed for (int i=0; i<3 && i"); output.println("

  • ");
      output.println(lex+" "+freq);
      //Sentence ids also printed
      List temp = lexOccur.get(lex);
      for (String id: temp) {
        //System.out.println(id);
        String[] idInfo = id.split("\\.");
        //System.out.println(idInfo[0]);
        StringTokenizer st = new StringTokenizer(id, ".");
        output.println("
      ");
        String idLink = "";
        String sentNo = "";
        String dir = "";
        //2 courses of action depending on whether input is gold std .auto parses or C&C .auto parses
        if (idInfo.length == 2) {
          idLink = st.nextToken() + ".html";
          sentNo = "#Sentence " + st.nextToken();
          dir = id.substring(4, 6);
        } else {
          idLink = idInfo[0];
          sentNo = "#Sentence " + idInfo[0];
          dir = idInfo[0];
        }
        output.println("
    • ");
        output.println(id);
        output.println(" ");
        output.println(idLink);
        output.println("");
        output.println("
    • ");
        output.println("
    ");
      }
      output.println("
  • "); output.println(""); output.println(""); output.flush(); } } } ================================================ FILE: src/opennlp/ccgbank/extract/DebugHelper.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// //Bkgrnd java class which helps with operations for debugging LFs package opennlp.ccgbank.extract; import java.util.*; import java.io.*; public class DebugHelper { public static boolean init = true; public static ArrayList unmatCats = new ArrayList(); public static int nsrCount = 0; public static int unmatCount = 0; public boolean getInit() { return init; } //Read in bkgrnd info public void readInfo() { try { BufferedReader inp = new BufferedReader(new FileReader( "/scratch/propgrammar/unmat.txt")); String line = ""; while ((line = inp.readLine()) != null) { if (line.length() == 0) continue; String parts[] = line.split(" "); String name = parts[parts.length - 2]; String pos = parts[parts.length - 1]; String x[] = name.split("="); String y[] = pos.split("="); name = purgeCat(x[1]); pos = purgeCat(y[1]); String unmat = name + " " + pos; unmatCats.add(unmat); //System.out.println(name+" "+pos); } //System.out.println(tagInfo); //System.out.println(tagInfo.size()); init = false; inp.close(); } catch (IOException e) { System.out.println("Error reading input file"); } } public String purgeCat(String cat) { cat = cat.replaceAll("\"", ""); cat = cat.replaceAll("~", ""); cat = cat.replaceAll("_[0-9]+", ""); cat = cat.replaceAll(">", ""); //System.out.println("Debug: "+cat); return cat; } public void recordInfo(String sentId, String pred, String misc) { nsrCount++; if (unmatCats.contains(misc)) unmatCount++; } public void printInfo() { System.out.println(unmatCats); System.out.println("No:of nsr LFs: " + nsrCount); System.out.println("No:of unmatched that a NSR LF contains: " + unmatCount); } } ================================================ FILE: src/opennlp/ccgbank/extract/DefaultLFHelper.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. 
// // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// //Bkgrnd java class which helps with operations for debugging LFs package opennlp.ccgbank.extract; import java.util.*; //import java.io.*; public class DefaultLFHelper { private ArrayList idTally = new ArrayList(); private Hashtable freqTable = new Hashtable(); private String lfType = "ord"; public void init() { lfType = "ord"; idTally = new ArrayList(); freqTable = new Hashtable(); argCounter = 0; } public void storeCat(String cat, String id, String idType) { int freq = 1; if (id.length() > 0) { //System.out.println(cat+" "+id+" "+idType); if (!freqTable.containsKey(id)) freqTable.put(id, freq); else { freq = freqTable.get(id) + 1; freqTable.put(id, freq); } if (id.equals("1") && idType.equals("inherits")) lfType = "mod-mod"; else if (!lfType.equals("mod-mod") && id.equals("1") && idTally.size() > 0 && idTally.get(0).equals("1")) lfType = "mod"; idTally.add(id); } } public String getType() { String retVal = lfType; lfType = ""; argCounter = 0; return retVal; } private int argCounter = 0; public String getArgNo(int argCount) { int argNo = argCount - argCounter; argCounter++; return Integer.toString(argNo); } public boolean isArg(String id) { //System.out.println(id); //System.out.println(freqTable); int freq = 0; if (freqTable.containsKey(id)) freq = freqTable.get(id); boolean retVal = false; if (freq == 1) retVal = true; return retVal; } public String purgeCat(String cat) { cat = cat.replaceAll("\"", ""); cat = cat.replaceAll("~", ""); cat = cat.replaceAll("_[0-9]+", ""); cat = cat.replaceAll(">", ""); //System.out.println("Debug: "+cat); return cat; } } ================================================ FILE: src/opennlp/ccgbank/extract/ExtractGrammar.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// package opennlp.ccgbank.extract; import java.io.File; import java.io.FileWriter; import java.io.PrintWriter; import java.util.Arrays; import java.util.Iterator; import java.util.List; import javax.xml.transform.stream.StreamSource; public class ExtractGrammar { /** Class for holding properties of desired grammar extraction. */ public static class ExtractionProperties { /** Whether to use the PP head augmented corpus. */ public boolean ppHeads = true; /** Source directory. */ public String srcDir = "/scratch/ccgbank/converted"; /** Destination directory. */ public String destDir = "/scratch/grammars/protogrammar"; /** Temp directory. */ public String tempDir = "/tmp/ccgbankextract"; /** Start section. */ public int startSection = 0; /** End section. */ public int endSection = 24; /** Selected file (-1 if none). */ public int fileNum = -1; /** Frequency cutoff for including an extracted cat. */ public int catFreqCutoff = 1; /** Frequency cutoff for including an extracted lex, cat, pos triple. */ public int lexFreqCutoff = 1; /** Frequency cutoff for making a family (ie, cat & pos) open. */ public int openFreqCutoff = 100; /** Rule frequency cutoff. */ public int ruleFreqCutoff = 1; /** Flag for whether to skip unmatched rules. */ public boolean skipUnmatched = false; /** Whether to show debug info for failed derivations. */ public boolean debugDerivs = false; /** File name for text only output. */ public String textfile = null; /** File name for text factors output. */ public String factorsfile = null; /** File name for observed supertag-rule combos.. */ public String combosfile = null; // Flag to add feats excl to the lexicon public boolean lexF = false; // Flag to adjust lfs of orig puncts ie those corrs to extant corp // binary rules public boolean origPuncts = false; // String taking names of macros as input. Expects a dash separated list public String macroSpecs = ""; // String taking names of LF specificity condtions as input. Expects a // dash separated list // Overt wh pronouns: wh public String lfSpecs = ""; } /** Processes args and invokes extraction steps. 
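 * A hypothetical invocation, using flags from the usage message below and the
 * default-style directories (both directory paths are illustrative):
 * <pre>
 *   java opennlp.ccgbank.extract.ExtractGrammar -s 00 --skipUnmatched \
 *        /scratch/ccgbank/converted /scratch/grammars/protogrammar
 * </pre>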
*/ public static void main(String args[]) throws Exception { List arguments = Arrays.asList(args); ExtractionProperties extractProps = new ExtractionProperties(); // flags for each extraction step boolean doLex = true; boolean doMorph = true; boolean doRules = true; boolean doTestbed = true; if (arguments.contains("-h") || arguments.contains("--help")) { System.out.println("usage: extractGrammar \n" + "\t[-noPPs|--noPPHeads] \n" + "\t[-lexF] \n" + "\t[-origPuncts] \n" + "\t[-s|--section sectnum] [-ss|--startSection sectnum] [-es|endSection sectnum] \n" + "\t[-f|--file filenum] \n" + "\t[--lexOnly|--morpOnly|--rulesOnly|--testbedOnly] [--skipLex] [--skipMorph] [--skipRules] [--skipTestbed]\n" + "\t[-tmp|--tempDir tempDir] \n" + "\t[-cfc|--catFreqCutoff num] \n" + "\t[-lfc|--lexFreqCutoff num] \n" + "\t[-ofc|--openFreqCutoff num] \n" + "\t[-rfc|--ruleFreqCutoff num] \n" + "\t[--skipUnmatched] \n" + "\t[-dd|--debugDerivs] \n" + "\t[--text textfile] [--textf factorsfile] \n" + "\t[--combos combosfile] \n" + "\t[srcDir] [destDir]"); System.exit(0); } if (arguments.contains("-noPPs") || arguments.contains("--noPPHeads")) { extractProps.ppHeads = false; } // process args Iterator it = arguments.iterator(); String s; boolean seenSrc = false; while (it.hasNext()) { s = it.next(); if (s.equals("-s") || s.equals("--section") || s.equals("-ss") || s.equals("--startSection") || s.equals("-es") || s.equals("--endSection")) { if (!it.hasNext()) { throw new IllegalArgumentException("encountered flag " + s + ", but no sectnum specified"); } int sectNum = Integer.parseInt(it.next()); if (s.equals("-s") || s.equals("--section") || s.equals("-ss") || s.equals("--startSection")) extractProps.startSection = sectNum; if (s.equals("-s") || s.equals("--section") || s.equals("-es") || s.equals("--endSection")) extractProps.endSection = sectNum; } else if (s.equals("-f") || s.equals("--filenum")) { if (!it.hasNext()) { throw new IllegalArgumentException("encountered flag " + s + ", but no filenum specified"); } extractProps.fileNum = Integer.parseInt(it.next()); } else if (s.equals("-lexF")) { System.out .println("Inserting lexicon specific feats - Punct filter placeholder feats now"); extractProps.lexF = true; } else if (s.equals("-origPuncts")) { extractProps.origPuncts = true; } else if (s.equals("--lexOnly")) { doMorph = false; doRules = false; doTestbed = false; } else if (s.equals("--morphOnly")) { doLex = false; doRules = false; doTestbed = false; } else if (s.equals("--rulesOnly")) { doLex = false; doMorph = false; doTestbed = false; } else if (s.equals("--testbedOnly")) { doLex = false; doMorph = false; doRules = false; } else if (s.equals("--skipLex")) { doLex = false; } else if (s.equals("--skipMorph")) { doMorph = false; } else if (s.equals("--skipRules")) { doRules = false; } else if (s.equals("--skipTestbed")) { doTestbed = false; } else if (s.equals("-tmp") || s.equals("--tempDir")) { if (!it.hasNext()) { throw new IllegalArgumentException("encountered flag " + s + ", but no temp dir specified"); } extractProps.tempDir = it.next(); } else if (s.equals("-cfc") || s.equals("--catFreqCutoff")) { if (!it.hasNext()) { throw new IllegalArgumentException("encountered flag " + s + ", but no num specified"); } int num = Integer.parseInt(it.next()); extractProps.catFreqCutoff = num; } else if (s.equals("-lfc") || s.equals("--lexFreqCutoff")) { if (!it.hasNext()) { throw new IllegalArgumentException("encountered flag " + s + ", but no num specified"); } int num = Integer.parseInt(it.next()); 
extractProps.lexFreqCutoff = num; } else if (s.equals("-ofc") || s.equals("--openFreqCutoff")) { if (!it.hasNext()) { throw new IllegalArgumentException("encountered flag " + s + ", but no num specified"); } int num = Integer.parseInt(it.next()); extractProps.openFreqCutoff = num; } else if (s.equals("-rfc") || s.equals("--ruleFreqCutoff")) { if (!it.hasNext()) { throw new IllegalArgumentException("encountered flag " + s + ", but no num specified"); } int num = Integer.parseInt(it.next()); extractProps.ruleFreqCutoff = num; } else if (s.equals("--skipUnmatched")) extractProps.skipUnmatched = true; else if (s.equals("-dd") || s.equals("--debugDerivs")) extractProps.debugDerivs = true; else if (s.equals("--text")) { if (!it.hasNext()) { throw new IllegalArgumentException("encountered flag " + s + ", but no file name specified"); } extractProps.textfile = it.next(); } else if (s.equals("--textf")) { if (!it.hasNext()) { throw new IllegalArgumentException("encountered flag " + s + ", but no file name specified"); } extractProps.factorsfile = it.next(); } else if (s.equals("--combos")) { if (!it.hasNext()) { throw new IllegalArgumentException("encountered flag " + s + ", but no file name specified"); } extractProps.combosfile = it.next(); } else if (!seenSrc) { extractProps.srcDir = s; seenSrc = true; } else { extractProps.destDir = s; } } // ensure directories exist or can be made File tempDir = new File(extractProps.tempDir); if (!tempDir.exists() && !tempDir.mkdirs()) throw new IllegalArgumentException( "could not create temp directory: " + extractProps.tempDir); File srcDir = new File(extractProps.srcDir); if (!srcDir.exists() || !srcDir.isDirectory()) throw new IllegalArgumentException( "source directory does not exist: " + extractProps.srcDir); File destDir = new File(extractProps.destDir); if (!destDir.exists() && !destDir.mkdirs()) throw new IllegalArgumentException( "could not create destination directory: " + extractProps.destDir); // log params System.out.println("Extracting Grammar"); System.out.println("Reading from: " + srcDir); System.out.println("Writing to: " + destDir); System.out.println("Temp dir: " + tempDir); System.out.println("Start section: " + extractProps.startSection); System.out.println("End section: " + extractProps.endSection); if (extractProps.fileNum >= 0) System.out.println("File: " + extractProps.fileNum); // do extraction steps if (doLex) LexExtract.extractLex(extractProps); if (doMorph) MorphExtract.extractMorph(extractProps); if (doRules) RulesExtract.extractRules(extractProps); // generate grammar.xml, if it doesn't already exist // nb: should eventually make schema refs relative to OPENCCG_HOME File gramFile = new File(destDir, "grammar.xml"); if (!gramFile.exists()) { System.out.println("Generating grammar.xml"); PrintWriter gramOut = new PrintWriter(new FileWriter(gramFile)); gramOut.println(""); gramOut.println(""); gramOut.println(" "); gramOut.println(" "); gramOut.println(" "); gramOut.println(""); gramOut.close(); } // do testbed if (doTestbed && !doTestbed) ; // nb: just avoiding a warning here // TODO if (doTestbed) Testbed.createTestFiles(extractProps); } /* Returns a stream source for the given resource from the class loader. 
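 * A hypothetical call (the resource name is illustrative and must resolve on
 * the classpath used to run the extraction):
 * <pre>
 *   StreamSource lexExtr = ExtractGrammar.getSource("lexExtr.xsl");
 * </pre>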
*/ public static StreamSource getSource(String resourceName) { ClassLoader cl = ExtractGrammar.class.getClassLoader(); return new StreamSource(cl.getResourceAsStream(resourceName)); } } ================================================ FILE: src/opennlp/ccgbank/extract/FreqTally.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// //Class which stores lexical info and associated frequencies. //This class is invoked by LexExtr.xsl and StemInsert.xsl transforms package opennlp.ccgbank.extract; import java.io.File; import java.io.FileNotFoundException; import java.io.FileOutputStream; import java.io.PrintWriter; import java.util.ArrayList; import java.util.Collections; import java.util.HashMap; import java.util.HashSet; import java.util.List; import java.util.Map; import java.util.Set; import opennlp.ccgbank.extract.ExtractGrammar.ExtractionProperties; //import javax.xml.transform.TransformerConfigurationException; //import javax.xml.transform.TransformerException; //import org.jdom.JDOMException; //import org.xml.sax.SAXException; public class FreqTally{ // Frequency cutoff for including an extracted cat public static int CAT_FREQ_CUTOFF = 1; // Frequency cutoff for including an extracted lex, cat, pos triple public static int LEX_FREQ_CUTOFF = 1; // Frequency cutoff for making a family (ie, cat & pos) open public static int OPEN_FREQ_CUTOFF = 100; //The object where lexical info of each category has been stored private static Map catInfo = new HashMap(); //Freq of cat specs private static Map catFreq = new HashMap(); //Sentence id private static String id=""; // Observed lex combos private static Set observedLexCombos = new HashSet(); /** Resets the statically held tallies. */ public static void reset() { catInfo = new HashMap(); catFreq = new HashMap(); id=""; observedLexCombos = new HashSet(); } //Proc which traps and stores id of each sentence public String storeId(String x) { if(x.length()>0){ id = x; int posEquals = x.indexOf('='); if (posEquals > 0) { id = x.substring(posEquals+1); } } return id; } //Changes case of proper nouns public String changeCase(String lex,String pos){ //if(!pos.equals("NNP") && !pos.equals("NNPS") && !lex.equals("I"))lex=lex.toLowerCase(); return lex; } // Creating a freq tally using hashtables. Invoked by LexExtr.xsl. // Returns whether cat+pos is seen for the first time. public boolean loadTally(String lex, String cat, String pos) { String key = catPosKey(cat, pos); CatNode cn; boolean retval; //First occurence of cat+pos. 
Entry made if(!catFreq.containsKey(key)){ cn = new CatNode(cat, pos); catInfo.put(key, cn); catFreq.put(key,1); retval = true; } else { // otherwise inc count cn = catInfo.get(key); catFreq.put(key, catFreq.get(key)+1); retval = false; } // store lex info cn.lexInsert(lex,id); return retval; } /** Returns a string key for a cat and pos. */ public static String catPosKey(String cat, String pos) { return cat+"-"+pos; } //Proc which outputs list of map keys in descending order of frequencies public static List sortTally(Map x) { // retval List sortedList = new ArrayList(); //Sorting by freq ArrayList vals1 = new ArrayList(x.values()); Collections.sort(vals1); //Removing unique frequencies to a new arraylist ArrayList vals = new ArrayList(vals1.size()); int prev = -1; for (Integer freq : vals1) { if (freq != prev) vals.add(freq); prev = freq; } //Finding all the keys corresponding to a particular freq for (int i=vals.size()-1; i >=0; i--) { int sortedFreq = vals.get(i); for (String key : x.keySet()) { int freq = x.get(key); if(freq==sortedFreq) sortedList.add(key); } } return sortedList; } public static void printTally(ExtractionProperties extractProps) throws FileNotFoundException { FreqTally.printTally(new File(extractProps.tempDir)); } public static void printTally(File directory) throws FileNotFoundException { System.out.println("Generating CorpFreq.html"); //Freq Output file File freqFile = new File(directory, "CorpFreq.html"); PrintWriter output=new PrintWriter(new FileOutputStream(freqFile)); List sortedCatKeys = sortTally(catFreq); //Printing the final ouput in html form output.println(""); output.println(""); output.println(""); output.println("Lexical Info"); output.println(""); output.println(""); output.println(""); output.flush(); for (int i=0; i < sortedCatKeys.size(); i++) { String key = sortedCatKeys.get(i); CatNode cn = catInfo.get(key); String cat = cn.cat; String pos = cn.pos; int freq = catFreq.get(key); output.println("
    "); output.println(i+1+" Category: "+cat+" POS: "+pos+" Freq: "+freq); output.println("
    "); output.println(); cn.printTally(output); output.flush(); } output.println(""); output.println(""); } /** Returns whether this lex combo has been seen for the first time. */ public boolean firstLexCombo(String lex, String stem, String rel, String cat, String pos,String semClass) { String key = lex + "_" + stem + "_" + rel + "_" + cat + "_" + pos + "_" + semClass; //String key = lex + "_" + stem + "_" + rel + "_" + cat + "_" + pos; if (observedLexCombos.contains(key)) return false; observedLexCombos.add(key); return true; } // returns the freq for the given key, or 0 if not present private int getFreq(String key) { Integer freq = catFreq.get(key); return (freq != null) ? freq : 0; } /** Returns the frequency of the cat and pos. */ public int getFreq(String cat, String pos) { String key = catPosKey(cat, pos); return getFreq(key); } /** Returns whether the cat and pos pass the frequency cutoff. */ public boolean checkFreqStatus(String cat, String pos) { /*if(cat.contains("Arg") || cat.startsWith("pp[")) return true;*/ /*if(id.contains("wsj_00")) return true;*/ return getFreq(cat, pos) >= CAT_FREQ_CUTOFF; } /** Returns whether the lex, cat and pos pass the frequency cutoffs. */ public boolean checkFreqStatus(String lex, String cat, String pos) { String key = catPosKey(cat, pos); //System.out.println(cat); if(cat.contains("pp[")) return true; /*if(id.contains("wsj_00")) return true;*/ if (getFreq(key) < CAT_FREQ_CUTOFF) return false; CatNode cn = catInfo.get(key); return cn.getLexFreq(lex) >= LEX_FREQ_CUTOFF; } /** Returns whether the cat and pos are for an open family. */ public boolean isOpen(String cat, String pos) { if (getFreq(cat, pos) < OPEN_FREQ_CUTOFF) return false; if (pos.startsWith("NN") || pos.equals("CD")) return true; else if (pos.startsWith("JJ") && (cat.equals("n_~1/n_1") || cat.equals("s[adj]_1\np_2"))) return true; else return false; } } ================================================ FILE: src/opennlp/ccgbank/extract/InsertLFHelper.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// //Helper Class for insertLF.xsl //This class is invoked by MorphExtr.xsl package opennlp.ccgbank.extract; import java.util.ArrayList; import java.util.HashSet; import java.util.List; import java.util.Set; public class InsertLFHelper{ private List featTally=new ArrayList(); //Flush feat tally public String initFeat(){ featTally.clear(); return null; } public String putFeat(String feat){ featTally.add(feat); return null; } public String getFeat(){ String feat=""; if (featTally.size() > 0) { feat = featTally.get(0); featTally.remove(0); } else feat="xxx"; return feat; } // for ensuring uniqueness of stem/rel pairs private Set stemRelPairs = new HashSet(); // reset public String resetStemRelPairs() { stemRelPairs.clear(); return null; } // contains, updating public boolean containsStemRelPair(String stem, String rel) { String key = stem + "_" + rel; if (stemRelPairs.contains(key)) return true; stemRelPairs.add(key); return false; } private String[] rolesArray = {}; // sets the roles public boolean setRoles(String roles) { rolesArray = roles.split("\\s+"); return true; } // returns the nth role public String getRole(int n) { return (n < rolesArray.length) ? rolesArray[n] : "null"; } } ================================================ FILE: src/opennlp/ccgbank/extract/LexExtract.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// //Program which creates a temp.xml file from the bareparse. 
temp.xml serves are the input for creating lexicon.xml & morph.xml package opennlp.ccgbank.extract; import java.io.File; import java.io.FileOutputStream; import java.io.IOException; import java.io.PrintWriter; import java.util.Arrays; import javax.xml.transform.Transformer; import javax.xml.transform.TransformerConfigurationException; import javax.xml.transform.TransformerException; import javax.xml.transform.TransformerFactory; import javax.xml.transform.sax.SAXResult; import javax.xml.transform.sax.SAXSource; import javax.xml.transform.sax.SAXTransformerFactory; import javax.xml.transform.stream.StreamResult; import javax.xml.transform.stream.StreamSource; import opennlp.ccgbank.extract.ExtractGrammar.ExtractionProperties; import org.apache.xml.serializer.OutputPropertiesFactory; import org.apache.xml.serializer.Serializer; import org.apache.xml.serializer.SerializerFactory; import org.jdom.JDOMException; import org.xml.sax.InputSource; import org.xml.sax.SAXException; import org.xml.sax.XMLFilter; import org.xml.sax.XMLReader; import org.xml.sax.helpers.XMLReaderFactory; /** * Program which reads in each file of the bare parse xml rep and generates a lexicon, * a freq tally of the lexical info and a list of ccgbank sentences. */ public class LexExtract{ public static void extractLex(ExtractionProperties extractProps) throws TransformerException,TransformerConfigurationException,SAXException,IOException,JDOMException { System.out.println("Extracting lexicon info:"); File lexFile = new File(new File(extractProps.destDir), "lexicon.xml"); File tempFile = new File(new File(extractProps.tempDir), "temp.xml"); PrintWriter tempOut = new PrintWriter(new FileOutputStream(tempFile),true); File ccgbankDir = new File(extractProps.srcDir); File[] ccgbankSections=ccgbankDir.listFiles(); Arrays.sort(ccgbankSections); FreqTally.CAT_FREQ_CUTOFF = extractProps.catFreqCutoff; FreqTally.LEX_FREQ_CUTOFF = extractProps.lexFreqCutoff; FreqTally.OPEN_FREQ_CUTOFF = extractProps.openFreqCutoff; //temp.xml creation TransformerFactory tFactory = TransformerFactory.newInstance(); Transformer lexExtrTransformer = tFactory.newTransformer(ExtractGrammar.getSource("opennlp.ccgbank/transform/lexExtr.xsl")); // add root tempOut.println(""); for (int i=extractProps.startSection; i<=extractProps.endSection; i++){ System.out.println("Section " + ccgbankSections[i].getName()); File[] files=ccgbankSections[i].listFiles(); Arrays.sort(files); int fileStart = 0; int fileLimit = files.length; if (extractProps.fileNum >= 0) { fileStart = extractProps.fileNum; fileLimit = extractProps.fileNum + 1; } for (int j=fileStart; j"); tempOut.flush(); tempOut.close(); //Generating a freq tally from static datastructures FreqTally.printTally(extractProps); System.out.println("Generating lexicon.xml"); if (tFactory.getFeature(SAXSource.FEATURE) && tFactory.getFeature(SAXResult.FEATURE)) { SAXTransformerFactory saxTFactory = ((SAXTransformerFactory) tFactory); // Create an XMLFilter for each stylesheet. 
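// The lexicon is built by chaining SAX filters, one per stylesheet; each setParent() call below feeds one
// filter's output into the next. By default events flow reader -> filterLex -> closedCatInsert -> insertLF ->
// insertPunctLF -> insertSemFeats -> markUnmatched; with -lexF, addFilterLexFeats is spliced in after
// insertPunctLF, and with -origPuncts, insertOrigPunctsLF replaces insertPunctLF. The last filter's output
// is serialized to lexicon.xml.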
// Extract lexicon from temp.xml XMLFilter xmlFilter0 = saxTFactory.newXMLFilter(ExtractGrammar.getSource("opennlp.ccgbank/transform/filterLex.xsl")); XMLFilter xmlFilter1 = saxTFactory.newXMLFilter(ExtractGrammar.getSource("opennlp.ccgbank/transform/closedCatInsert.xsl")); XMLFilter xmlFilter2 = saxTFactory.newXMLFilter(ExtractGrammar.getSource("opennlp.ccgbank/transform/insertLF.xsl")); XMLFilter xmlFilter3 = saxTFactory.newXMLFilter(ExtractGrammar.getSource("opennlp.ccgbank/transform/insertPunctLF.xsl")); XMLFilter xmlFilter4 = saxTFactory.newXMLFilter(ExtractGrammar.getSource("opennlp.ccgbank/transform/insertOrigPunctsLF.xsl")); XMLFilter xmlFilter5 = saxTFactory.newXMLFilter(ExtractGrammar.getSource("opennlp.ccgbank/transform/addFilterLexFeats.xsl")); XMLFilter xmlFilter6 = saxTFactory.newXMLFilter(ExtractGrammar.getSource("opennlp.ccgbank/transform/insertSemFeats.xsl")); XMLFilter xmlFilter7 = saxTFactory.newXMLFilter(ExtractGrammar.getSource("opennlp.ccgbank/transform/markUnmatched.xsl")); // Create an XMLReader. XMLReader reader = XMLReaderFactory.createXMLReader(); // xmlFilter0 uses the XMLReader as its reader. xmlFilter0.setParent(reader); xmlFilter1.setParent(xmlFilter0); xmlFilter2.setParent(xmlFilter1); xmlFilter3.setParent(xmlFilter2); if (extractProps.lexF) { xmlFilter5.setParent(xmlFilter3); xmlFilter6.setParent(xmlFilter5); } else if (extractProps.origPuncts) { xmlFilter4.setParent(xmlFilter2); xmlFilter6.setParent(xmlFilter4); } else xmlFilter6.setParent(xmlFilter3); xmlFilter7.setParent(xmlFilter6); XMLFilter xmlFilter = xmlFilter7; java.util.Properties xmlProps = OutputPropertiesFactory.getDefaultMethodProperties("xml"); xmlProps.setProperty("indent", "yes"); xmlProps.setProperty("standalone", "no"); xmlProps.setProperty("{http://xml.apache.org/xalan}indent-amount", "2"); Serializer serializer = SerializerFactory.getSerializer(xmlProps); serializer.setOutputStream(new FileOutputStream(lexFile)); xmlFilter.setContentHandler(serializer.asContentHandler()); xmlFilter.parse(new InputSource(tempFile.getPath())); } } } ================================================ FILE: src/opennlp/ccgbank/extract/MorphExtrHelper.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// //This class is invoked by MorphExtr.xsl package opennlp.ccgbank.extract; import java.util.HashSet; import java.util.Set; public class MorphExtrHelper { private FreqTally aFreqTally = new FreqTally(); private Set seenLexPos = new HashSet(); /** Returns whether the lex, cat and pos pass the frequency cutoffs, * and the lex-stem-pos combo is new. 
*/ public boolean checkFreqAndNoveltyStatus(String lex, String stem, String cat, String pos,String semClass) { if (!aFreqTally.checkFreqStatus(lex, cat, pos)) return false; String key = lex + "_" + stem + "_" + "_" + pos + "_"+ semClass; //String key = lex + "_" + stem + "_" + "_" + pos; if (seenLexPos.contains(key)) return false; seenLexPos.add(key); return true; } //Applies rules to discern whether noun is animate or not public String macroNamer(String macro, String semClass,String pos,String lex){ if((semClass.startsWith("PER") && pos.startsWith("N"))||pos.equals("DT")){ macro=macro+" "+"@anim-nom"; } else if(pos.startsWith("PP") || lex.equals("those") || (pos.startsWith("PRP") && !lex.startsWith("it"))) macro=macro+" "+"@anim-nom"; else macro=macro+" "+"@non-anim-nom"; macro=macro.trim(); //Skip date time entities from animacy classification if(semClass.contains("STATE") || semClass.contains("NATION") || semClass.startsWith("ORG_DESC") || semClass.contains("DATE")||semClass.contains("TIME")||semClass.contains("QUANTITY")||semClass.contains("CARDINAL") || semClass.contains("PERCENT")) macro=""; //Eliminate collective nouns if(lex.equals("audience") || lex.equals("band") || lex.equals("group") || lex.equals("team") || lex.equals("club") || lex.equals("congregation")) macro=""; return macro; } //Applies rules to discern whether noun should have number agreement for the copula macro public String agrMacroDecider(String macro,String semClass,String pos,String lex){ if(pos.equals("NN")){ //if(lex.equals("couple") || lex.equals("following") ||lex.equals("rest") || semClass.contains("STATE") || semClass.contains("NATION") || semClass.startsWith("ORG_DESC") || semClass.contains("DATE")||semClass.contains("TIME")||semClass.contains("QUANTITY")||semClass.contains("CARDINAL") ||semClass.endsWith("'S")) if(lex.equals("couple") || semClass.startsWith("ORG_DESC") || lex.equals("following") ||lex.equals("rest") || semClass.contains("STATE") || semClass.contains("NATION") || semClass.contains("DATE")||semClass.contains("TIME")||semClass.contains("QUANTITY")||semClass.contains("CARDINAL") || semClass.contains("PERCENT") || semClass.endsWith("'S")) macro=""; if(semClass.length()==0) macro=""; } else{ } //System.out.println(macro); return macro; } public String whLex=""; public void storeWHLex(String whLex){ //System.out.println("Raja: "+whLex); this.whLex=whLex; } public String getWHLex(){ return this.whLex; } } ================================================ FILE: src/opennlp/ccgbank/extract/MorphExtract.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// //Program which takes in the /tmp/temp.xml file generated and forms a morph.xml file package opennlp.ccgbank.extract; import java.io.File; import java.io.FileOutputStream; import java.io.IOException; import java.util.ArrayList; import javax.xml.transform.TransformerConfigurationException; import javax.xml.transform.TransformerException; import javax.xml.transform.TransformerFactory; import javax.xml.transform.sax.SAXResult; import javax.xml.transform.sax.SAXSource; import javax.xml.transform.sax.SAXTransformerFactory; import opennlp.ccgbank.extract.ExtractGrammar.ExtractionProperties; import org.apache.xml.serializer.OutputPropertiesFactory; import org.apache.xml.serializer.Serializer; import org.apache.xml.serializer.SerializerFactory; import org.jdom.JDOMException; import org.xml.sax.InputSource; import org.xml.sax.SAXException; import org.xml.sax.XMLFilter; import org.xml.sax.XMLReader; import org.xml.sax.helpers.XMLReaderFactory; public class MorphExtract { public static void extractMorph(ExtractionProperties extractProps) throws TransformerException, TransformerConfigurationException, SAXException, IOException, JDOMException { System.out.println("Extracting morph:"); System.out.println("Generating morph.xml"); TransformerFactory tFactory = TransformerFactory.newInstance(); File morphFile = new File(new File(extractProps.destDir), "morph.xml"); File tempFile = new File(new File(extractProps.tempDir), "temp.xml"); if (tFactory.getFeature(SAXSource.FEATURE) && tFactory.getFeature(SAXResult.FEATURE)) { SAXTransformerFactory saxTFactory = ((SAXTransformerFactory) tFactory); ArrayList filterChain = new ArrayList(); ArrayList xslChain = new ArrayList(); if (extractProps.macroSpecs.length() > 0) { } addTransforms(xslChain, extractProps.macroSpecs); for (String xslFile : xslChain) filterChain.add(saxTFactory.newXMLFilter(ExtractGrammar .getSource(xslFile))); // Create an XMLReader and set first xsl transform to that. XMLReader reader = XMLReaderFactory.createXMLReader(); XMLFilter xmlFilter0 = filterChain.get(0); xmlFilter0.setParent(reader); //Create chain of xsl transforms // Create an XMLFilter for each stylesheet. 
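// Wire each filter's parent to the previous one so that SAX events flow from the XMLReader through
// morphExtr.xsl and any macro-insertion stylesheets before being serialized to morph.xml below.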
for (int i = 1; i < filterChain.size(); i++) { XMLFilter xmlFilterPrev = filterChain.get(i - 1); XMLFilter xmlFilterCurr = filterChain.get(i); xmlFilterCurr.setParent(xmlFilterPrev); } XMLFilter xmlFilter = filterChain.get(filterChain.size() - 1); java.util.Properties xmlProps = OutputPropertiesFactory .getDefaultMethodProperties("xml"); xmlProps.setProperty("indent", "yes"); xmlProps.setProperty("standalone", "no"); xmlProps.setProperty("{http://xml.apache.org/xalan}indent-amount", "2"); Serializer serializer = SerializerFactory.getSerializer(xmlProps); serializer.setOutputStream(new FileOutputStream(morphFile)); //XMLFilter xmlFilter = xmlFilter2; //XMLFilter xmlFilter = xmlFilter3; xmlFilter.setContentHandler(serializer.asContentHandler()); xmlFilter.parse(new InputSource(tempFile.getPath())); } //Deleting the temporary lex file //tempFile.delete(); } public static void addTransforms(ArrayList xslChain, String macroSpecs) { xslChain.add("opennlp.ccgbank/transform/morphExtr.xsl"); if (macroSpecs.length() == 0) xslChain.add("opennlp.ccgbank/transform/macroInsert.xsl"); if (macroSpecs.contains("agr")) { System.out .println("Inserting a macro to check agreement in the copula"); xslChain.add("opennlp.ccgbank/transform/agr-macroInsert.xsl"); } if (macroSpecs.contains("anim")) { System.out .println("Inserting a macro to check animacy constraints"); xslChain.add("opennlp.ccgbank/transform/anim-macroInsert.xsl"); } } } ================================================ FILE: src/opennlp/ccgbank/extract/RulesExtract.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
////////////////////////////////////////////////////////////////////////////// //Program which extracts unary rules and their frequencies and finally outputs the rules.xml file package opennlp.ccgbank.extract; import java.io.File; import java.io.FileOutputStream; import java.io.IOException; import java.io.PrintWriter; import java.util.Arrays; import javax.xml.transform.Transformer; import javax.xml.transform.TransformerConfigurationException; import javax.xml.transform.TransformerException; import javax.xml.transform.TransformerFactory; import javax.xml.transform.sax.SAXResult; import javax.xml.transform.sax.SAXSource; import javax.xml.transform.sax.SAXTransformerFactory; import javax.xml.transform.stream.StreamResult; import javax.xml.transform.stream.StreamSource; import opennlp.ccgbank.extract.ExtractGrammar.ExtractionProperties; import org.apache.xml.serializer.OutputPropertiesFactory; import org.apache.xml.serializer.Serializer; import org.apache.xml.serializer.SerializerFactory; import org.jdom.JDOMException; import org.xml.sax.InputSource; import org.xml.sax.SAXException; import org.xml.sax.XMLFilter; import org.xml.sax.XMLReader; import org.xml.sax.helpers.XMLReaderFactory; public class RulesExtract { public static void extractRules(ExtractionProperties extractProps) throws TransformerException, TransformerConfigurationException,SAXException, IOException,JDOMException{ System.out.println("Extracting rule info:"); File rulesFile = new File(new File(extractProps.destDir), "rules.xml"); File tempFile = new File(new File(extractProps.tempDir), "temp-rules.xml"); PrintWriter tempOut=new PrintWriter(new FileOutputStream(tempFile),true); File ccgbankDir = new File(extractProps.srcDir); File[] ccgbankSections=ccgbankDir.listFiles(); Arrays.sort(ccgbankSections); RulesTally.RULE_FREQ_CUTOFF = extractProps.ruleFreqCutoff; RulesTally.KEEP_UNMATCHED = !extractProps.skipUnmatched; // add root tempOut.println(""); TransformerFactory tFactory = TransformerFactory.newInstance(); Transformer transformer = tFactory.newTransformer(ExtractGrammar.getSource("opennlp.ccgbank/transform/rulesExtr.xsl")); for (int i=extractProps.startSection; i<=extractProps.endSection; i++){ File[] files=ccgbankSections[i].listFiles(); Arrays.sort(files); int fileStart = 0; int fileLimit = files.length; if (extractProps.fileNum >= 0) { fileStart = extractProps.fileNum; fileLimit = extractProps.fileNum + 1; } for (int j=fileStart; j"); tempOut.close(); RulesTally.printTally(extractProps); System.out.println("Generating rules.xml"); if (tFactory.getFeature(SAXSource.FEATURE) && tFactory.getFeature(SAXResult.FEATURE)){ SAXTransformerFactory saxTFactory = ((SAXTransformerFactory) tFactory); // Create an XMLFilter for each stylesheet. XMLFilter xmlFilter1 = saxTFactory.newXMLFilter(ExtractGrammar.getSource("opennlp.ccgbank/transform/ccgRules.xsl")); //XMLFilter xmlFilter3 = saxTFactory.newXMLFilter(new StreamSource("foo3.xsl")); // Create an XMLReader. XMLReader reader = XMLReaderFactory.createXMLReader(); // xmlFilter1 uses the XMLReader as its reader. 
xmlFilter1.setParent(reader); java.util.Properties xmlProps = OutputPropertiesFactory.getDefaultMethodProperties("xml"); xmlProps.setProperty("indent", "yes"); xmlProps.setProperty("standalone", "no"); xmlProps.setProperty("{http://xml.apache.org/xalan}indent-amount", "2"); Serializer serializer = SerializerFactory.getSerializer(xmlProps); serializer.setOutputStream(new FileOutputStream(rulesFile)); XMLFilter xmlFilter = xmlFilter1; xmlFilter.setContentHandler(serializer.asContentHandler()); xmlFilter.parse(new InputSource(tempFile.getPath())); } //Deleting the temporory lex file //lexiconTempFile.delete(); } } ================================================ FILE: src/opennlp/ccgbank/extract/RulesTally.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// //Class which stores unary rule freqs //This class is invoked by the RulesExtr.xsl transform package opennlp.ccgbank.extract; import java.io.File; import java.io.FileNotFoundException; import java.io.FileOutputStream; import java.io.PrintWriter; import java.util.ArrayList; import java.util.HashMap; import java.util.List; import java.util.Map; import java.util.StringTokenizer; import opennlp.ccgbank.extract.ExtractGrammar.ExtractionProperties; public class RulesTally { // Frequency cutoff for including an extracted rule public static int RULE_FREQ_CUTOFF = 1; // Flag for whether to keep unmatched rules in extracted grammar public static boolean KEEP_UNMATCHED = true; //Unary Rule Freq private static Map ruleFreq = new HashMap(); //Rule Occurrence private static Map> ruleOccur = new HashMap>(); //Sentence id private static String id=""; /** Resets the statically held tallies. 
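 * Because ruleFreq, ruleOccur and the sentence id are static, counts would otherwise carry over
 * between extraction runs within the same JVM.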
*/ public static void reset() { ruleFreq = new HashMap(); ruleOccur = new HashMap>(); id=""; } //Proc which traps and stores id of each sentence public String storeId(String x){ if(x.length()>0){ id = x; int posEquals = x.indexOf('='); if (posEquals > 0) { id = x.substring(posEquals+1); } } return id; } //Loads freq tables, returns rule name public String loadTally(String res, String arg) throws FileNotFoundException{ arg = arg.replaceAll("_\\d", ""); res = res.replaceAll("_\\d", ""); String rule = arg+"_to_"+res; List temp; //Freq table entry opened at first instance of rule if (!ruleFreq.containsKey(rule)) { ruleFreq.put(rule,1); temp = new ArrayList(4); temp.add(id); ruleOccur.put(rule,temp); } else { int freq = ruleFreq.get(rule)+1; ruleFreq.put(rule,freq); temp = ruleOccur.get(rule); } //First 4 instances of rules stored if(temp.size()<4 && !temp.contains(id)){ temp.add(id); ruleOccur.put(rule,temp); } return rule; } public static void printTally(ExtractionProperties extractProps) throws FileNotFoundException { RulesTally.printTally(new File(extractProps.tempDir)); } //Rule Frequencies printed to file public static void printTally(File directory) throws FileNotFoundException{ System.out.println("Generating RuleFreq.html"); //Freq Output file File freqFile = new File(directory, "RuleFreq.html"); PrintWriter output=new PrintWriter(new FileOutputStream(freqFile)); List ruleList = FreqTally.sortTally(ruleFreq); //Printing the final ouput in html form output.flush(); output.println(""); output.println(""); output.println("");output.println("Unary Rule Info");output.println(""); output.println(""); output.println(""); output.flush(); String ccgbankHome = System.getProperty("CCGBANK_HOME", "/home/corpora/EN/ccgbank"); for (int i=0; i"); output.println(i+1+" Rule: "+rule+" Freq: "+freq); output.println("
    "); output.flush(); List rules = ruleOccur.get(rule); output.flush(); output.println("
      "); output.println("
    • "); output.flush(); for (int j=0; j"); id=rules.get(j); String[]idInfo=id.split("\\."); StringTokenizer st=new StringTokenizer(id,"."); String idLink=""; String sentNo=""; String dir=""; //2 courses of action depending on whether input is gold std .auto parses or C&C .auto parses if(idInfo.length==2){ idLink=st.nextToken()+".html"; sentNo="#Sentence "+st.nextToken(); dir=id.substring(4,6); } else { idLink=idInfo[0]; sentNo="#Sentence "+idInfo[0]; dir=idInfo[0]; } //System.out.println(idLink); output.println("
    • "); output.println(id); output.println(" "); output.println(idLink); output.println(""); output.println("
    • "); output.println("
    "); } output.flush(); output.println(""); output.println(""); output.println(""); output.flush(); } output.flush(); output.println(""); output.println(""); output.flush(); output.close(); } //Invoked by RulesExtr.xsl to check repetition of categories public boolean checkRuleStatus(String rule) { Integer freq = ruleFreq.get(rule); return (freq != null && freq == 1); } //Checks the freq of a rule public boolean checkRuleFreqStatus(String rule){ int freq = ruleFreq.get(rule); //Freqs >= cutoff accepted return (freq >= RULE_FREQ_CUTOFF); } // returns flag public boolean keepUnmatched() { return KEEP_UNMATCHED; } } ================================================ FILE: src/opennlp/ccgbank/extract/Testbed.java ================================================ /////////////////////////////////////////////////////////////////////////////// // Copyright (C) 2005-2009 Scott Martin, Rajakrishan Rajkumar and Michael White // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ////////////////////////////////////////////////////////////////////////////// //Program which creates a temp.xml file from the bareparse. temp.xml serves are the input for creating lexicon.xml & morph.xml package opennlp.ccgbank.extract; import java.io.*; import java.util.*; import opennlp.ccgbank.CCGBankTaskSources; import opennlp.ccgbank.CCGBankTaskTestbed; import opennlp.ccg.grammar.Grammar; import opennlp.ccg.grammar.RuleGroup; import opennlp.ccg.hylo.*; import opennlp.ccg.lexicon.*; import opennlp.ccg.parse.ParseException; import opennlp.ccg.synsem.*; import opennlp.ccg.test.*; import opennlp.ccg.unify.*; import org.jdom.Document; import org.jdom.Element; import org.jdom.JDOMException; import org.jdom.input.SAXBuilder; import org.jdom.output.Format; import org.jdom.output.XMLOutputter; /** * Creates test files under in 'test' dir under extracted grammar. 
*/ public class Testbed { // the grammar private Grammar grammar; private Lexicon lexicon; private RuleGroup rules; // supertagger stand-in private SupertaggerStandIn supertaggerStandIn = new SupertaggerStandIn(); // results of following deriv private Sign sign = null; private LF lf = null; private String str = ""; private int numParses = 0; private String header = ""; // Store info related to treenodes in the xml deriv private static ArrayList treeInfo = new ArrayList(); private static boolean treeInfoFlag = false; // Store details of preds (nomId key: pos,stag, pos and pred name) private static Hashtable predInfo = new Hashtable(); // supertag-rule combos private Set combos = null; Set sourcesSet; CCGBankTaskTestbed ccgBankTaskTestbed; File grammarFile, targetDirectory; // constructor public Testbed(Set sourcesSet, File targetDirectory, CCGBankTaskTestbed testbed) throws IOException { grammarFile = new File(targetDirectory, "grammar.xml"); this.grammar = new Grammar(grammarFile.toURI().toURL(), true); this.lexicon = grammar.lexicon; this.rules = grammar.rules; this.sourcesSet = sourcesSet; this.targetDirectory = targetDirectory; this.ccgBankTaskTestbed = testbed; } // main method for creating test files @SuppressWarnings("rawtypes") public void createTestFiles() throws IOException, JDOMException { ccgBankTaskTestbed.log("Creating test files:"); // config grammar Tokenizer tokenizer = grammar.lexicon.tokenizer; grammar.prefs.showFeats = true; grammar.prefs.showSem = ccgBankTaskTestbed.isShowsSem(); // ensure test dir exists File testDir = new File(targetDirectory, "test"); testDir.mkdirs(); ccgBankTaskTestbed.log("Writing test files to: " + testDir.getPath()); // text, class-replaced text factors etc. output PrintWriter textPW = null; PrintWriter textscPW = null; PrintWriter factorsPW = null; PrintWriter combosPW = null; PrintWriter predsPW = null; PrintWriter treePW = null; File textFile = ccgBankTaskTestbed.getText(); File factorsFile = ccgBankTaskTestbed.getFactors(); File combosFile = ccgBankTaskTestbed.getCombos(); File predsFile = ccgBankTaskTestbed.getPreds(); File treeFile = ccgBankTaskTestbed.getTree(); if (textFile != null) { File textscFile=new File(textFile.getParent()+"/"+textFile.getName().replaceFirst("text-","textsc-")); ccgBankTaskTestbed.log("Writing text to: " + textFile); ccgBankTaskTestbed.log("Writing class-replaced text to: " + textscFile); textFile.getParentFile().mkdirs(); textPW = new PrintWriter(new BufferedWriter(new FileWriter(textFile))); textscPW = new PrintWriter(new BufferedWriter(new FileWriter(textscFile))); } if (factorsFile != null) { ccgBankTaskTestbed.log("Writing factors to: " + factorsFile); factorsFile.getParentFile().mkdirs(); factorsPW = new PrintWriter(new BufferedWriter(new FileWriter(factorsFile))); } if (combosFile != null) { ccgBankTaskTestbed.log("Writing supertag-rule combos to: " + combosFile); combosFile.getParentFile().mkdirs(); combos = new HashSet(); combosPW = new PrintWriter(new BufferedWriter(new FileWriter(combosFile))); } if (predsFile != null) { ccgBankTaskTestbed.log("Writing preds to: " + predsFile); predsFile.getParentFile().mkdirs(); predsPW = new PrintWriter(new BufferedWriter(new FileWriter(predsFile))); } if (treeFile != null) { ccgBankTaskTestbed.log("Writing tree node info to: " + treeFile); treeFile.getParentFile().mkdirs(); treePW = new PrintWriter(new BufferedWriter(new FileWriter(treeFile))); treeInfoFlag = true; } // jdom stuff SAXBuilder builder = new SAXBuilder(); XMLOutputter outputter = new 
XMLOutputter(Format.getPrettyFormat()); // counters int numWithLFs = 0; int numSingleRootLFs = 0; int numWithoutLFs = 0; for (CCGBankTaskSources sources : sourcesSet) { for (File file : sources) { File testSectDir = new File(testDir, file.getParentFile().getName()); testSectDir.mkdir(); ccgBankTaskTestbed.log("Debug Print: " + testSectDir.getAbsolutePath()); // parse derivations Document inDoc = builder.build(file); Element inRoot = inDoc.getRootElement(); // make test doc, sign map Document outDoc = new Document(); Element outRoot = new Element("regression"); outDoc.setRootElement(outRoot); Map signMap = new HashMap(); // loop through derivations, making test items List derivElts = inRoot.getChildren(); for (Object derivObj : derivElts) { Element derivElt = (Element) derivObj; followDeriv(derivElt); if (lf != null) { numWithLFs++; // check for single root if (lf instanceof SatOp) numSingleRootLFs++; // add test item, sign Element item = RegressionInfo.makeTestItem(grammar, str, numParses, lf); if (header == null) { header = "missing"; ccgBankTaskTestbed.log("Warning: missing header in " + file); } item.setAttribute("info", header); if (header != null) signMap.put(header, sign); // Add parsed words as a separate LF element Element fullWordsElt = new Element("full-words"); fullWordsElt.addContent(tokenizer.format(sign.getWords())); // Add info about LF lexical preds as a separate element Element predInfoElt = new Element("pred-info"); String predInfoText = collectPredInfo(header); predInfoElt.setAttribute("data", predInfoText); item.addContent(fullWordsElt); item.addContent(predInfoElt); outRoot.addContent(item); // append to text, factors files if (textPW != null) textPW.println(str); if (textscPW != null) { textscPW.flush(); String textsc=""; //Note sem class replacement works only for NE classes spec in the grammar file textsc=tokenizer.getOrthography((List)sign.getWords(),true); textscPW.println(textsc); textscPW.flush(); } if (factorsPW != null) factorsPW.println(tokenizer.format(sign.getWords())); // append new combos to combos file if (combosPW != null) { for (String combo : newCombos()) combosPW.println(combo); } // also to preds if (predsPW != null) predsPW.println(predInfoText); if (treePW != null) { for (String info : treeInfo) { treePW.println(info); treePW.flush(); } } treeInfo = new ArrayList(); } else numWithoutLFs++; } // write test doc, saved signs File regressionFile = new File(testSectDir, file.getName()); outputter.output(outDoc, new FileOutputStream(regressionFile)); RegressionInfo.writeSerFile(signMap, regressionFile); } } // flush text, factors, combos, preds, tree files if (textPW != null) { textPW.flush(); textPW.close(); } if (factorsPW != null) { factorsPW.flush(); factorsPW.close(); } if (combosPW != null) { combosPW.flush(); combosPW.close(); } if (predsPW != null) { predsPW.flush(); predsPW.close(); } if (treePW != null) { treePW.flush(); treePW.close(); } // summary ccgBankTaskTestbed.log("numWithLFs: " + numWithLFs); ccgBankTaskTestbed.log("numSingleRootLFs: " + numSingleRootLFs); ccgBankTaskTestbed.log("numWithoutLFs: " + numWithoutLFs); ccgBankTaskTestbed.log("total: " + (numWithLFs + numWithoutLFs)); } private void followDeriv(Element derivElt) { // reset sign = null; lf = null; str = ""; header = derivElt.getAttributeValue("Header"); // bookkeeping UnifyControl.startUnifySequence(); try { Category cat = null; Nominal index = null; LF flatLF = null; // recurse through deriv SignHash signs = followDerivR(derivElt); // set results, using first available sign 
(ie some arbitrary one) if (!signs.isEmpty()) { Iterator iter = signs.asSignSet().iterator(); // System.out.println("Processing file no: "+header); // Count of single rooted LFs produced by the constrained parser int matchSRLF = 0; // Check whether any of the signs have a single rooted LF while (iter.hasNext()) { // System.out.println("Found LF"); sign = iter.next(); cat = sign.getCategory(); index = cat.getIndexNominal(); flatLF = cat.getLF(); if (flatLF != null) { lf = HyloHelper.compactAndConvertNominals(flatLF, index, sign); // Break when the first single rooted LF is encountered if (lf instanceof SatOp) { matchSRLF++; // System.out.println("Single root LF found"); break; } } } // If no single rooted LF is there, using first available sign // (ie some arbitrary one) if (matchSRLF == 0) { sign = signs.asSignSet().iterator().next(); cat = sign.getCategory(); index = cat.getIndexNominal(); flatLF = cat.getLF(); if (flatLF != null) lf = HyloHelper.compactAndConvertNominals(flatLF, index, sign); } if (flatLF != null) { extrPredInfo(flatLF, ""); } numParses = signs.size(); str = str.trim(); } } catch (ParseException exc) { ccgBankTaskTestbed.log("Warning for " + header + ": " + exc.toString()); } } // recurse through deriv, returning signs @SuppressWarnings({ "rawtypes", "unchecked" }) private SignHash followDerivR(Element derivElt) throws ParseException { String eltName = derivElt.getName(); // follow deriv, applying combinatory rules // nb: no checks made for intended deriv! if (eltName.equals("Treenode")) { String cat = derivElt.getAttributeValue("cat"); String ntId = derivElt.getAttributeValue("nt_id"); String simpleCat = derivElt.getAttributeValue("stag"); List childElts = derivElt.getChildren(); int numChildren = childElts.size(); if (numChildren == 0) throw new ParseException(header + ": no child elements for TreeNode for cat: " + cat); // if no cat element present, adjust list with an initial dummy node, // to avoid code changes in what follows Element elt0 = (Element) childElts.get(0); String elt0name = elt0.getName(); if (elt0name.equals("Treenode") || elt0name.equals("Leafnode")) { childElts.add(0, new Element("dummy")); numChildren++; } if (numChildren != 2 && numChildren != 3) throw new ParseException(header + ": wrong number of child elements: " + numChildren + " for cat: " + cat); Element firstInputElt = (Element) childElts.get(1); SignHash firstSigns = followDerivR(firstInputElt); SignHash retval = new SignHash(); // unary case if (numChildren == 2) { // apply rules for (Sign s : firstSigns.asSignSet()) { List results = rules.applyUnaryRules(s); for (Sign rSign : results) retval.insert(rSign); } // caution/warn upon failure if (!containsCat(retval, simpleCat)) { boolean noResults = retval.isEmpty(); String inCat = firstInputElt.getAttributeValue("cat"); String msg = "Unable to derive: " + cat + " from: " + inCat; if (!noResults) ccgBankTaskTestbed.log("Caution for " + header + ": " + msg); if (ccgBankTaskTestbed.isDebugDerivations()) { ccgBankTaskTestbed.log(header + ": derivation stymied; inputs: "); for (Sign s : firstSigns.asSignSet()) { ccgBankTaskTestbed.log(s.toString()); } if (!noResults) { ccgBankTaskTestbed.log("Outputs: "); for (Sign s : retval.asSignSet()) ccgBankTaskTestbed.log(s.toString()); } } if (noResults) throw new ParseException("Derivation blocked: " + msg); } } // binary case else if (numChildren == 3) { Element secondInputElt = (Element) childElts.get(2); SignHash secondSigns = followDerivR(secondInputElt); // apply rules for (Sign sign1 : 
firstSigns.asSignSet()) { for (Sign sign2 : secondSigns.asSignSet()) { List results = rules.applyBinaryRules(sign1, sign2); for (Sign rSign : results) retval.insert(rSign); } } // if no results, propagate one input if the other is // internal punct if (retval.isEmpty()) { if (isPunct(secondInputElt)) return firstSigns; else if (isPunct(firstInputElt)) return secondSigns; } // caution/warn upon failure if (!containsCat(retval, simpleCat)) { boolean noResults = retval.isEmpty(); String inCat1 = firstInputElt.getAttributeValue("cat"); String inCat2 = secondInputElt.getAttributeValue("cat"); String msg = "Unable to derive: " + cat + " from: " + inCat1 + " and: " + inCat2; if (!noResults) ccgBankTaskTestbed.log("Caution for " + header + ": " + msg); if (ccgBankTaskTestbed.isDebugDerivations()) { ccgBankTaskTestbed.log(header + ": derivation stymied; first inputs: "); for (Sign sign1 : firstSigns.asSignSet()) { ccgBankTaskTestbed.log(sign1.toString()); } ccgBankTaskTestbed.log("Second inputs: "); for (Sign sign2 : secondSigns.asSignSet()) { ccgBankTaskTestbed.log(sign2.toString()); } if (!noResults) { ccgBankTaskTestbed.log("Outputs: "); for (Sign s : retval.asSignSet()) ccgBankTaskTestbed.log(s.toString()); } } if (noResults) throw new ParseException("Derivation blocked: " + msg); } } // Store cat ids of tree nodes for printing to aux files if (treeInfoFlag) { for (Sign s : retval.asSignSet()) { Hashtable idConvTally = new Hashtable(); Hashtable freqTally = new Hashtable(); ArrayList fullCat = new ArrayList(); String catId = ""; Category treeCat = s.getCategory(); // System.out.println(header+" "+ntId+" "+treeCat); recurseCat(treeCat, fullCat, idConvTally, freqTally); /* * System.out.println(freqTally); * System.out.println(fullCat); System.out.println('\n'); */ if (fullCat.size() > 1) { for (String x : fullCat) { String y[] = x.split("_"); if (y.length == 1) { catId = catId + "," + y[0]; continue; } int freq = freqTally.get(y[1]); freqTally.put(y[1], freq - 1); if (x.endsWith("_M") && freq <= 1) x = x.replaceFirst("_M", ""); catId = catId + "," + x; } catId = catId.replaceFirst(",", ""); treeInfo.add(header + " " + ntId + " " + catId); } /* * System.out.println(idConvTally); * System.out.println(fullCat); System.out.println('\n'); */ } } // done return retval; } // lex lookup // nb: not always insisting on right POS, b/c hashing strategy uses // surface words, // thus doesn't distinguish lex signs based solely on POS // nb: might make sense to warn on lex cats with missing semantics else if (eltName.equals("Leafnode")) { try { String lex = derivElt.getAttributeValue("lexeme"); Word w = lexicon.tokenizer.parseToken(lex); str += w.getForm() + " "; String cat = derivElt.getAttributeValue("cat"); String simpleCat = derivElt.getAttributeValue("stag"); String rel = derivElt.getAttributeValue("rel"); String indexRel = derivElt.getAttributeValue("indexRel"); String semClass = ""; semClass = derivElt.getAttributeValue("class"); String roles = derivElt.getAttributeValue("argRoles"); String pos = derivElt.getAttributeValue("pos"); // nb: for now, need to ignore rel for non-VB pos if (!pos.startsWith("VB")) rel = null; // lex lookup with required supertag // NB: there's no guarantee of getting the right arg roles if the word-cat pair is observed lexicon.setSupertagger(supertaggerStandIn); supertaggerStandIn.setTag(simpleCat); SignHash lexSigns = lexicon.getSignsFromWord(w); if (semClass == null || semClass.length() == 0) semClass = "NoClass"; // add lex signs, filtered by rel, reindexed // also check 
number with matching pos, match on no class int matchPOS = 0; boolean matchNoClass = false; for (Iterator it = lexSigns.asSignSet().iterator(); it.hasNext();) { Sign s = it.next(); Word wTemp = s.getWords().get(0); String morphClass = wTemp.getSemClass(); if (morphClass == null || morphClass.length() == 0) morphClass = "NoClass"; Category lexcat = s.getCategory(); LF lexLF = lexcat.getLF(); // allow any class if no sem class given if (!(semClass.equals("NoClass") || semClass.equals(morphClass)) || !containsPred(lexLF, rel) || !containsRoles(lexLF, roles) || !containsRel(lexLF, indexRel, s)) { it.remove(); } else { UnifyControl.reindex(lexcat); if (wTemp.getPOS().equals(pos)) { matchPOS++; if (semClass.equals("NoClass") && morphClass.equals("NoClass")) matchNoClass = true; } } } // filter by pos unless none match if (matchPOS > 0) { for (Iterator it = lexSigns.asSignSet().iterator(); it.hasNext();) { Sign s = it.next(); Word wTemp = s.getWords().get(0); if (!wTemp.getPOS().equals(pos)) { it.remove(); continue; } // filter by mismatched class if apropos if (matchNoClass) { String morphClass = wTemp.getSemClass(); if (morphClass != null && morphClass.length() != 0) it.remove(); } } } if (lexSigns.isEmpty()) throw new LexException("No matching category " + cat + " for: " + w); return lexSigns; } catch (LexException exc) { // try continuing derivations without lex signs for punctuation, // otherwise throw parse exception if (isPunct(derivElt)) { if (ccgBankTaskTestbed.isDebugDerivations()) { ccgBankTaskTestbed.log(header + ": " + exc.toString()); } return new SignHash(); } throw new ParseException(exc.toString()); } catch (RuntimeException exc) { // for other exceptions, throw parse exception throw new ParseException(exc.toString()); } } else throw new RuntimeException(header + ": unrecognized element in derivation: " + eltName); } // Recurse through a CCG cat and print out the atomcats and their ids private static void recurseCat(Category cat, ArrayList fullCat, Hashtable idConvTally, Hashtable freqTally) { if (cat instanceof ComplexCat) { ComplexCat cc = (ComplexCat) cat.copy(); Category resCat = cc.getResult(); recurseCat(resCat, fullCat, idConvTally, freqTally); int argStart = 0; if (resCat instanceof ComplexCat) { ComplexCat temp = (ComplexCat) resCat.copy(); argStart = temp.getArgStack().size(); } ArgStack argStack = cc.getArgStack(argStart); for (int i = 0; i < argStack.size(); i++) { if (argStack.get(i) instanceof BasicArg) { BasicArg bArg = (BasicArg) argStack.get(i); Category argCat = (Category) bArg.getCat(); Slash argSlash = (Slash) bArg.getSlash(); // System.out.println(argSlash.toString()+'\n'); fullCat.add(argSlash.toString()); recurseCat(argCat, fullCat, idConvTally, freqTally); } } } else if (cat instanceof AtomCat) { AtomCat ac = (AtomCat) cat.copy(); FeatureStructure fs = ac.getFeatureStructure(); if (fs.hasAttribute("index")) { String index = fs.getValue("index").toString(); // System.out.println(index); String id[] = index.split(":"); if (!idConvTally.containsKey(id[0])) idConvTally.put(id[0], Integer.toString(idConvTally.size() + 1)); String numId = idConvTally.get(id[0]); String catId = ac.getType() + "_" + numId; if (!freqTally.containsKey(numId)) freqTally.put(numId, 0); int freq = freqTally.get(numId); freqTally.put(numId, freq + 1); if (fs.hasAttribute("mod-index")) catId = catId + "_" + "M"; // System.out.println('\n'); fullCat.add(catId); } } } // returns whether the given LF contains the given the lexical predicate private static boolean containsPred(LF lf, String 
pred) { if (pred == null) return true; if (lf == null) return false; for (SatOp satOp : HyloHelper.getPreds(lf)) { if (HyloHelper.isLexPred(satOp)) { if (HyloHelper.getLexPred(satOp).equals(pred)) return true; } } return false; } // roles in a given LF private static Set rolesSet = new HashSet(); // returns whether the given LF contains the given the lexical predicate private static boolean containsRoles(LF lf, String roles) { if (roles == null) return true; if (lf == null) return false; String[] rolesArray = roles.split("\\s+"); // get roles in LF rolesSet.clear(); for (SatOp satOp : HyloHelper.getPreds(lf)) { if (HyloHelper.isRelPred(satOp)) { rolesSet.add(HyloHelper.getRel(satOp)); } } // check presence of roles in LF for (String role : rolesArray) { if (role.equals("null") || role.equals("e")) continue; if (!rolesSet.contains(role)) return false; } return true; } // returns whether the given LF contains the given indexRel private static boolean containsRel(LF lf, String indexRel, Sign sign) { if (indexRel == null) return true; if (lf == null) return false; indexRel = "<" + indexRel + ">"; /* * System.out.println(sign.getSupertag()+" "+sign.getPOS()); * System.out.println(indexRel); System.out.println(rolesSet); * System.out.println(lf); System.out.println('\n'); */ // check presence of that rel/feat in LF if (!lf.toString().contains(indexRel)) return false; else return true; } // identifies punctuation private static boolean isPunct(Element elt) { String pos = elt.getAttributeValue("pos"); if (pos == null) return false; return (pos.equals("|") || pos.equals(".") || pos.equals(",") || pos.equals(";") || pos.equals(":") || pos.equals("LRB") || pos.equals("RRB") || pos.equals("``") || pos.equals("''")); } // return whether signs contains cat; filter if so private static boolean containsCat(SignHash signs, String cat) { // special case: give free pass to cats with dollars if (!signs.isEmpty() && cat.indexOf('$') >= 0) return true; // check for cat boolean retval = false; for (Sign sign : signs.asSignSet()) { String supertag = sign.getCategory().getSupertag(); // again, give free pass to cats with dollars if (supertag.indexOf('$') >= 0 || cat.equals(supertag)) { retval = true; break; } } // filter if found if (retval) { for (Iterator it = signs.asSignSet().iterator(); it.hasNext();) { Sign sign = it.next(); String supertag = sign.getCategory().getSupertag(); if (supertag.indexOf('$') >= 0 || cat.equals(supertag)) continue; else it.remove(); } } return retval; } // returns new combos for current sign private List newCombos() { List retval = new ArrayList(); newCombos(sign, retval); return retval; } // recursively adds new combos for given sign private void newCombos(Sign s, List retval) { Sign[] inputs = s.getDerivationHistory().getInputs(); if (inputs != null) { StringBuffer sb = new StringBuffer(); for (int i = 0; i < inputs.length; i++) { sb.append(inputs[i].getCategory().getSupertag()).append(' '); } sb.append(s.getDerivationHistory().getRule().name()); String combo = sb.toString(); if (!combos.contains(combo)) { retval.add(combo); combos.add(combo); } for (int i = 0; i < inputs.length; i++) { newCombos(inputs[i], retval); } } } // Extracts nom-id,pos,supertag info related to LF lexical preds private void extrPredInfo(LF lf, String sentId) { // System.out.println(sentId); extractPredInfo(lf, predInfo); } /** * Extracts the nom id, pos, and supertag info related to LF lexical preds, * and puts it in the given map keyed off the nom id. * Note that the map should be cleared for each new LF. 
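 * Each entry maps a nominal id (the part of the nominal index before any ':') to a string of the
 * form supertag:pos:lex, with the individual fields escaped via DefaultTokenizer.escape.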
*/ public static void extractPredInfo(LF lf, Map predInfoMap) { String predData = ""; List preds = HyloHelper.getPreds(lf); for (SatOp pred : preds) { String lexPred = HyloHelper.getLexPred(pred); if (lexPred == null) continue; if (!(pred.getArg() instanceof Proposition)) continue; Proposition p = (Proposition) pred.getArg(); String lex = (p.getName()).toString(); // Get supertag & pos tag info and store that String stag = pred.getOrigin().getSupertag(); String pos = pred.getOrigin().getPOS(); Nominal nom = pred.getNominal(); String nomInd = nom.toString(); String nomIndParts[] = nomInd.split(":"); if (stag == null || pos == null || lex == null) continue; predData = escape(stag) + ":" + escape(pos) + ":" + escape(lex); predInfoMap.put(nomIndParts[0], predData); } } // Collects nom-id,pos,supertag info related to LF lexical preds for this // particular LF private static String collectPredInfo(String sentId) { String predData = ""; for (Enumeration e = predInfo.keys(); e.hasMoreElements();) { String nomId = e.nextElement(); predData = predData + " " + nomId + ":" + predInfo.get(nomId); } predInfo = new Hashtable(); return predData.trim(); } /** * Returns the pred info string for the given pred info map (see extractPredInfo). */ public static String getPredInfo(Map predInfoMap) { String predData = ""; for (String nomId : predInfoMap.keySet()) { predData = predData + " " + nomId + ":" + predInfoMap.get(nomId); } return predData.trim(); } // escapes a string using DefaultTokenizer private static String escape(String s) { return DefaultTokenizer.escape(s); } // stands in for a supertagger during lex lookup private static class SupertaggerStandIn implements SupertaggerAdapter { // map for a single key private Map map = new HashMap(2); public Map getSupertags() { return map; } // set tag void setTag(String tag) { map.clear(); map.put(tag, 1.0); } // dummy implementations public void setIncludeGold(boolean includeGold) {} public void resetBeta() {} public void resetBetaToMax() {} public void nextBeta() {} public void previousBeta() {} public boolean hasMoreBetas() { return false; } public boolean hasLessBetas() { return false; } public double[] getBetas() { return new double[]{1.0}; } public void setBetas(double[] betas) {} public double getCurrentBetaValue() { return 1.0; } } } ================================================ FILE: src/opennlp/ccgbank/lexicon-base.xsl ================================================ ================================================ FILE: src/opennlp/ccgbank/parse/CCGbankDerivation.jjt ================================================ // Grammar to parse all the ccgbank derivations in a given ccgbank file options { MULTI=true; NODE_DEFAULT_VOID=false; NODE_SCOPE_HOOK=true; STATIC=true; USER_TOKEN_MANAGER=false; NODE_PREFIX=""; NODE_USES_PARSER=true; } PARSER_BEGIN(CCGbankDerivation) package opennlp.ccgbank.parse; import java.util.*; import org.apache.tools.ant.Task; //import java.io.*; public class CCGbankDerivation { // The java code to operate the node scope hook static void jjtreeOpenNodeScope(Node n) { ((SimpleNode)n).first_token = getToken(1); } static void jjtreeCloseNodeScope(Node n) { ((SimpleNode)n).last_token = getToken(0); } } PARSER_END(CCGbankDerivation) // enter PROPINFO state (for extra Propbank-derived info) on "{" // nb: this is a workaround for ATOMCAT being perhaps too broadly defined TOKEN: { : PROPINFO } // return to normal on ">" at end of node <*> TOKEN: { "> : DEFAULT } // tokens in PROPINFO state TOKEN: { } TOKEN: { } TOKEN: { } TOKEN: { } // 
for stems and sem roles TOKEN: { } TOKEN: { } TOKEN: { } // regular tokens // mww: ATOMCAT is really too broad, b/c it's used for words too ... TOKEN: { | | ("\\/")*)+|("\\*")+> //The SPL token is for treebank words like "1\/2" or "bassoonist\/pianist\/composer" or "\*" where the middle tokens stand elsewhere for ccg operations. //So the SPL prevents such words from interfering with the tokenization } <*> SKIP: { " " | "\t" | "\n" | "\r" } SimpleNode start(): {} { // Every file consists of one or more treebank entries // Each treebank entry consists of 1 header and 1 or more treenodes or leafnodes ( header() ( LOOKAHEAD(2) leafnode() | treenode()) )+ { return jjtThis; } } void header(): { Token t1 = new Token(); Token t2 = new Token(); Token t3 = new Token(); jjtThis.type="Header"; } { // Header, eg: ID=wsj_2300.1 PARSER=GOLD NUMPARSE=1 t1= [t2= t3=] { jjtThis.header = t1.image + " " + t2.image + " " + t3.image; } } void treenode(): { Token leftover = new Token(); Token head = new Token(); Token dtr = new Token(); Token lex = new Token(); Token sense = new Token(); Token role = new Token(); jjtThis.type="Treenode"; } { // Storing the ccgID. (mww: huh?) // Sample Treenode: // With Propbank roles: "(" " head= dtr= { jjtThis.leftover=leftover.image; } | head= dtr= ) // Headedness, number of dtrs info stored in the SimpleNode data structure { jjtThis.head=head.image; jjtThis.dtr=dtr.image; } // optional propbank info // nb: need to use eg instead of "." once in PROPINFO lex state [ "{" lex= sense= role= { jjtThis.nodeRoles = new ArrayList(3); jjtThis.nodeRoles.add(new SimpleNode.LexSenseRole(lex.image, sense.image, role.image)); } ( lex= sense= role= { jjtThis.nodeRoles.add(new SimpleNode.LexSenseRole(lex.image, sense.image, role.image)); } )* ] // closure of one the root of a treenode // A treenode consists of 1 or more treenodes or leafnodes. ( LOOKAHEAD(2) leafnode() | treenode() )+ ")" // Close of a treenode } void leafnode(): { Token t = new Token(); Token lex = new Token(); Token sense = new Token(); Token role = new Token(); jjtThis.type="Leafnode"; } { /* Sample Leafnode structures: () () () */ "(" " { jjtThis.pos = t.image; } // The pos tag has been repeated in the ccgbank. // For numerals (null) is an entry. // Hence the optional brackets in the bnf below. ( ["("] [")"]) ( t= | t= ) { jjtThis.lex = t.image; } catSpec() // optional propbank info [ "{" lex= sense= role= // role or 'rel' { jjtThis.nodeRoles = new ArrayList(3); jjtThis.nodeRoles.add(new SimpleNode.LexSenseRole(lex.image, sense.image, role.image)); } ( lex= sense= role= { jjtThis.nodeRoles.add(new SimpleNode.LexSenseRole(lex.image, sense.image, role.image)); } )* ] [ role= { jjtThis.argRoles = new ArrayList(4); jjtThis.argRoles.add(role.image); } ( role= { jjtThis.argRoles.add(role.image); } )* ] //">" ")" } void catSpec(): { jjtThis.type="complexcat"; } { // The result category (atomic or complex) ( ( "(" catSpec() ")" [] ) // mww: the extra "atomcat" is really for an index on the complex cat | atomcat() ) // The argument of the function (atomic or complex). // Note: The following could be processed as a separate production "Embedded category" , but this would produce a node of that name. // To avoid that, the preceding BNF notation has been repeated here. 
[ op() ( ( "(" catSpec() ")" [] ) | atomcat() ) ] } void catSpecRedundant(): { jjtThis.type="Redundant"; } { ( ( "(" catSpec() ")" ) | atomcat() ) [ op() ( ( "(" catSpec() ")" ) | atomcat() ) ] } void atomcat(): { jjtThis.type="atomcat"; } { } void op(): { Token t = new Token(); jjtThis.type="op"; } { t= { jjtThis.cat=t.image; } } ================================================ FILE: src/opennlp/ccgbank/parse/SimpleNode.java ================================================ /* Generated By:JJTree: Do not edit this line. SimpleNode.java */ package opennlp.ccgbank.parse; import java.util.List; import opennlp.ccgbank.parse.CCGbankDerivation; import opennlp.ccgbank.parse.CCGbankDerivationTreeConstants; public class SimpleNode implements Node { //Javacc generated variables protected Node parent; protected Node[] children; protected int id; protected CCGbankDerivation parser; //User defined variables // lex, sense, role triples public static class LexSenseRole { public String lex, sense, role; public LexSenseRole(String lex, String sense, String role) { this.lex = lex; this.sense = sense; this.role = role; } } //CCGbank id public String header; //The serial no of the gold standard parse String parseNo = ""; //Node type eg:-Treenode,Leafnode,atomcat etc public String type = ""; //Traps any feature which is leftover public String leftover; //Headedness info 0 or 1 public String head = ""; //No:of daughters of a node public String dtr = ""; //Category Specification public String cat = ""; //Category Specification without co-indexation info in leafnodes public String catRedundant = ""; //Lexical information public String lex = ""; //Part of speech info. eg: RB, IN etc public String pos = ""; // The roles (or rel) that the node plays public List nodeRoles = null; // The arg roles of a verbal cat public List argRoles = null; //First token in the node scope Token first_token; //Final token in the node scope Token last_token; //Function which produces the content of the node. public String print() throws Exception { Token p = first_token; while (p != last_token) { cat = cat + p.image; p = p.next; } return cat + last_token.image; } //The remaining part incl comments is Javacc generated. public SimpleNode(int i) { id = i; } public SimpleNode(CCGbankDerivation p, int i) { this(i); parser = p; } /** * @return the header */ public String getHeader() { return header; } /** * @param header the header to set */ public void setHeader(String header) { this.header = header; } /** * @return the leftover */ public String getLeftover() { return leftover; } public int getId(){ return id; } public void jjtOpen() { } public void jjtClose() { } public void jjtSetParent(Node n) { parent = n; } public Node jjtGetParent() { return parent; } public void jjtAddChild(Node n, int i) { if (children == null) { children = new Node[i + 1]; } else if (i >= children.length) { Node c[] = new Node[i + 1]; System.arraycopy(children, 0, c, 0, children.length); children = c; } children[i] = n; } public Node jjtGetChild(int i) { return children[i]; } public int jjtGetNumChildren() { return (children == null) ? 0 : children.length; } /* You can override these two methods in subclasses of SimpleNode to customize the way the node appears when the tree is dumped. If your output uses more than one line you should override toString(String), otherwise overriding toString() is probably all you need to do. 
*/ @Override public String toString() { return CCGbankDerivationTreeConstants.jjtNodeName[id]; } public String toString(String prefix) { return prefix + toString(); } /* Override this method if you want to customize how the node dumps out its children. */ public void dump(String prefix) { System.out.println(toString(prefix)); if (children != null) { for (int i = 0; i < children.length; ++i) { SimpleNode n = (SimpleNode) children[i]; if (n != null) { n.dump(prefix + " "); } } } } } ================================================ FILE: src/opennlp/ccgbank/parse/grammarInsert ================================================ static void jjtreeOpenNodeScope(Node n) { ((SimpleNode)n).first_token = getToken(1); } static void jjtreeCloseNodeScope(Node n) { ((SimpleNode)n).last_token = getToken(0); } ================================================ FILE: src/opennlp/ccgbank/rules-base.xsl ================================================ ================================================ FILE: src/pom.xml ================================================ 4.0.0 opennlp openccg 0.10.0 1.8 1.8 ${project.build.directory}/generated-sources jdom jdom 1.1 trove trove 1.0.2 org.apache.ant ant 1.9.0 net.sf.jgrapht jgrapht 0.8.3 net.sf.jopt-simple jopt-simple 3.1 junit junit 4.12 jline jline 1.0 org.eclipse.birt.runtime.3_7_1 org.apache.xml.serializer 2.7.1 openccg . maven-compiler-plugin 3.7.0 **/.backup.orig/** srilmbridge/ kenlm/ org.codehaus.mojo javacc-maven-plugin 2.6 jjt generate-sources jjtree-javacc ${basedir}/opennlp/ccgbank/parse/ ${project.build.gen}/jjtree/ jj generate-sources javacc ${project.build.gen}/jjtree/opennlp/ccgbank/parse/ ${project.build.gen}/jjtree/ org.codehaus.mojo build-helper-maven-plugin generate-sources add-source ${project.build.gen} ================================================ FILE: src/srilmbridge/Makefile ================================================ compile: javah -d . -classpath ${OPENCCG_HOME}/classes \ opennlp.ccg.ngrams.SRILMNgramModel g++ -o ${OPENCCG_HOME}/lib/libsrilmbridge.so \ -Wl,-soname,srilmbridge.so \ -I${JAVA_HOME}/include \ -I${JAVA_HOME}/include/linux \ -I${SRILM}/include \ -L${SRILM}/lib/i686 \ srilmbridge.cpp ${SRILM}/lm/src/LM.cc \ -shared -lc -ldstruct -lflm -llattice -lmisc -loolm \ -Wno-deprecated clean: rm ${OPENCCG_HOME}/lib/libsrilmbridge.so rm opennlp_ccg_ngrams_SRILMNgramModel.h ================================================ FILE: src/srilmbridge/srilmbridge.cpp ================================================ /* $Id: srilmbridge.cpp,v 1.13 2007/06/16 22:26:28 coffeeblack Exp $ */ #include #include #include #include #include "opennlp_ccg_ngrams_SRILMNgramModel.h" /* * Bridge from Java to the SRILM toolkit library. Loads a language model based * on specified parameters, then calculates the probability of a word within a * given context. * * Author: Scott Martin (http://www.ling.osu.edu/~scott/) * Version: $Revision: 1.13 $ */ const static unsigned STANDARD = 0, COUNT = 1; /* * The language model we will use to calculate word probabilities. */ LM *lm = NULL; /* * The type of language model in effect, as specified in loadLM. */ unsigned nativeLMType = STANDARD; /* * Loads a language model from a specified file with the specified ngram order. * The parameter lmType specifies what type (format) of language model to * expect. * * Throws: * java.io.IOException If fileName is null or empty or if a problem is * encountered reading the language model file. * java.lang.IllegalStateException If an LM has already been loaded. 
* java.lang.IllegalArgumentException If the specified LM type is not * supported. Currently supports STANDARD (type 0) and COUNT (type 1). */ JNIEXPORT void JNICALL Java_opennlp_ccg_ngrams_SRILMNgramModel_loadLM (JNIEnv *env, jobject obj, jint order, jstring fileName, jint lmType) { if(lm != NULL) { // already loaded env->ThrowNew(env->FindClass("java/lang/IllegalStateException"), "LM already loaded"); return; } nativeLMType = lmType; if(nativeLMType < STANDARD || nativeLMType > COUNT) { // only STANDARD and COUNT are allowed env->ThrowNew(env->FindClass("java/lang/IllegalArgumentException"), "LM type not supported"); return; } if(fileName == 0 || env->GetStringLength(fileName) == 0) { env->ThrowNew(env->FindClass("java/io/IOException"), "problem reading LM: empty file name"); return; } Vocab *vocab = new Vocab; lm = (nativeLMType == COUNT) ? (LM *)new NgramCountLM(*vocab, order) : (LM *)new Ngram(*vocab, order); const char* nativeFileName = env->GetStringUTFChars(fileName, NULL); File file(nativeFileName, "r", 0); unsigned lmError = 0; if(((File *)&file)->error() > 0) { lmError = 1; env->ThrowNew(env->FindClass("java/io/IOException"), "problem with LM file"); } else if(!lm->read(file)) { lmError = 1; env->ThrowNew(env->FindClass("java/io/IOException"), "problem reading LM"); } //TODO the following just repeats finalize(), should be in reusable function if(lmError > 0) { // destroy lm so this can be called again vocab->~Vocab(); if(lm != NULL) { if(nativeLMType == STANDARD) { ((Ngram *)lm)->~Ngram(); } else if(nativeLMType == COUNT) { ((NgramCountLM *)lm)->~NgramCountLM(); } else { // as a failsafe, call the abstract destructor lm->~LM(); } delete lm; } lm = NULL; //TODO clean up file somehow? } ((File *)&file)->close(); env->ReleaseStringUTFChars(fileName, nativeFileName); } /* * Uses the SRILM toolkit library to calculate the log prob of a word in a * specified context. The context is a history of tokens preceding the * specified word, given in reverse order. For example, to find the * probability of "rain" in the context "in the rain", this method should be * called with "rain" as the parameter `word' and the array {"the", "in"} in * the parameter `context'. * * To calculate the log probability of a single word with no context, call this * method with either (1) NULL, or (2) a zero-length array as the value of * the parameter `context'. * * Throws: * java.lang.IllegalStateException If an error occurred while loading * the LM and word probabilities cannot be computed. * java.lang.IllegalArgumentException If the specified word is null or * zero-length or if the specified context contains a null or zero-length * string. */ JNIEXPORT jfloat JNICALL Java_opennlp_ccg_ngrams_SRILMNgramModel_doLogProb (JNIEnv *env, jobject obj, jstring word, jobjectArray context) { // make sure LM is ok to use if(lm == NULL) { env->ThrowNew(env->FindClass("java/lang/IllegalStateException"), "LM not loaded"); return 0; } // sanity checks must throw Java exceptions if(word == NULL || env->GetStringLength(word) == 0) { env->ThrowNew(env->FindClass("java/lang/IllegalArgumentException"), "word is null or zero-length"); return 0; } int contextLength = (context == NULL) ?
0 : env->GetArrayLength(context); VocabString nativeWord = (VocabString)env->GetStringUTFChars(word, NULL); VocabString nativeContext[contextLength + 1]; nativeContext[contextLength] = NULL; // context must be terminated by NULL // build context, converting each Java string to a VocabString jstring jstr = NULL; for(unsigned i = 0; i < contextLength; i++) { jstr = (jstring)env->GetObjectArrayElement(context, i); if(jstr == NULL || env->GetStringLength(jstr) == 0) { env->ThrowNew(env->FindClass("java/lang/IllegalArgumentException"), "context contains null or zero-length string"); env->DeleteLocalRef(jstr); env->ReleaseStringUTFChars(word, nativeWord); // release word // release already translated strings (signed index so the loop terminates when i is 0) for(int j = (int) i - 1; j >= 0; j--) { env->ReleaseStringUTFChars( (jstring)env->GetObjectArrayElement(context, j), nativeContext[j]); } return 0; } nativeContext[i] = (VocabString)env->GetStringUTFChars(jstr, NULL); } if(jstr != NULL) { env->DeleteLocalRef(jstr); } LogP prob = lm->wordProb(nativeWord, nativeContext); // clean up env->ReleaseStringUTFChars(word, nativeWord); // release word // release context strings if any for(unsigned k = 0; k < contextLength; k++) { env->ReleaseStringUTFChars((jstring)env->GetObjectArrayElement(context, k), nativeContext[k]); } return prob; } /* * Should be called by a finalize() method from within Java. Calls the * destructor method on the language model object we are using. */ JNIEXPORT void JNICALL Java_opennlp_ccg_ngrams_SRILMNgramModel_finalize (JNIEnv *env, jobject obj) { if(lm != NULL) { // call local destructors if type was specified if(nativeLMType == STANDARD) { ((Ngram *)lm)->~Ngram(); } else if(nativeLMType == COUNT) { ((NgramCountLM *)lm)->~NgramCountLM(); } else { // as a failsafe, call the abstract destructor lm->~LM(); } delete lm; } } ================================================ FILE: test/grammar.xml ================================================ ================================================ FILE: test/lexicon.xml ================================================ ================================================ FILE: test/morph.xml ================================================ ================================================ FILE: test/opennlp/ccg/alignment/AlignmentTest.java ================================================ package opennlp.ccg.alignment; import static opennlp.ccg.alignment.PhrasePosition.A; import static opennlp.ccg.alignment.PhrasePosition.B; import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertFalse; import static org.junit.Assert.assertNotSame; import static org.junit.Assert.assertNull; import static org.junit.Assert.assertTrue; import static org.junit.Assert.fail; import java.util.Collections; import java.util.HashMap; import java.util.HashSet; import java.util.Iterator; import java.util.Map; import java.util.Set; import org.junit.Before; import org.junit.Test; public class AlignmentTest { Integer id; Phrase one, two; Set mappings; Alignment alignment; Map> map, pam; Set twoAVals; @Before public void setUp() throws Exception { id = new Integer(37); one = new Phrase(id, Alignments.tokenize("This is it .")); two = new Phrase(id, Alignments.tokenize("A test this is .")); mappings = new HashSet(); mappings.add(new Mapping(id, 0, 2)); mappings.add(new Mapping(id, 1, 3)); mappings.add(new Mapping(id, 3, 4)); mappings.add(new Mapping(id, 2, 0)); mappings.add(new Mapping(id, 2, 1)); map = new HashMap>(); pam = new HashMap>(); map.put(0, new HashSet(Collections.singleton(2)));
map.put(1, new HashSet(Collections.singleton(3))); map.put(3, new HashSet(Collections.singleton(4))); twoAVals = new HashSet(); twoAVals.add(0); twoAVals.add(1); twoAVals = Collections.unmodifiableSet(twoAVals); map.put(2, twoAVals); pam.put(2, new HashSet(Collections.singleton(0))); pam.put(3, new HashSet(Collections.singleton(1))); pam.put(4, new HashSet(Collections.singleton(3))); pam.put(0, new HashSet(Collections.singleton(2))); pam.put(1, new HashSet(Collections.singleton(2))); alignment = new Alignment(one, two, mappings); assertEquals(mappings, alignment); } @Test public void testCompare() { Phrase o = new Phrase(43, one), t = new Phrase(43, two); Set ms = new HashSet(); for(Mapping m : mappings) { ms.add(m.copyWithPhraseNumber(43)); } Alignment a = new Alignment(o, t, ms); assertEquals(-1, alignment.compareTo(a)); assertEquals(1, a.compareTo(alignment)); assertEquals(0, a.compareTo(a)); assertEquals(0, alignment.compareTo(alignment)); } @Test public void testAlignment() { try { new Alignment(null, two, mappings); fail("able to create alignment with null phrase"); } catch(IllegalArgumentException expected) { // do nothing } try { new Alignment(one, null, mappings); fail("able to create alignment with null phrase"); } catch(IllegalArgumentException expected) { // do nothing } try { new Alignment(one, two, null); fail("able to create alignment with null mappings"); } catch(IllegalArgumentException expected) { // do nothing } } @Test public void testSize() { assertEquals(mappings.size(), alignment.size()); } @Test public void testGet() { assertEquals(one, alignment.getA()); assertEquals(two, alignment.getB()); assertNotSame(one, alignment.getB()); } @Test public void testAddMapping() { Mapping m = new Mapping(id, 0, 4); assertTrue(alignment.add(m)); assertFalse(alignment.add(new Mapping(id, 3, 4))); alignment.remove(m); try { alignment.add(new Mapping(id + 1, 0, 4)); fail("able to add mapping with non-matching ID"); } catch(IllegalArgumentException expected) { // do nothing } try { alignment.add(new Mapping(id, null, 5)); fail("able to add mapping with null index"); } catch(IllegalArgumentException expected) { // do nothing } try { alignment.add(new Mapping(id, 0, 5)); fail("able to add mapping with out of bounds index"); } catch(IndexOutOfBoundsException expected) { // do nothing } try { alignment.add(new Mapping(id, -2, 3)); fail("able to add mapping with out of bounds index"); } catch(IndexOutOfBoundsException expected) { // do nothing } try { alignment.add(new Mapping(id, 5, 3)); fail("able to add mapping with out of bounds index"); } catch(IndexOutOfBoundsException expected) { // do nothing } try { alignment.add(new Mapping(id, 3, -3)); fail("able to add mapping with out of bounds index"); } catch(IndexOutOfBoundsException expected) { // do nothing } } @Test public void testGetTargets() { Set ts = alignment.getTargets(2, A); Set s = new HashSet(); s.add(0); s.add(1); assertFalse(s.retainAll(ts)); assertEquals(s.size(), ts.size()); ts.add(4); assertTrue(ts.contains(4)); try { ts.remove(4); assertFalse(ts.contains(4)); } catch(UnsupportedOperationException e) { fail("unable to call remove()"); } try { Iterator i = ts.iterator(); i.next(); i.remove(); } catch(UnsupportedOperationException e) { fail("unable to call iterator().remove()"); } } @Test public void testMapEntrySet() { Map> amap = alignment.asMap(A), bmap = alignment.asMap(B); Set s = new HashSet(twoAVals); for(Map.Entry> e : amap.entrySet()) { if(e.getKey().equals(2)) { assertEquals(s, e.getValue()); } } Iterator>> i = 
bmap.entrySet().iterator(); while(i.hasNext()) { Map.Entry> e = i.next(); if(e.getKey().equals(1)) { assertEquals(Collections.singleton(2), e.getValue()); } else if(e.getKey().equals(4)) { assertEquals(Collections.singleton(3), e.getValue()); } else { try { i.remove(); } catch(UnsupportedOperationException ex) { fail("unable to call Iterator.remove()"); } try { assertTrue(e.getValue().add(3)); assertTrue(e.getValue().contains(3)); assertFalse(e.getValue().add(3)); } catch(UnsupportedOperationException ex) { fail("unable to add to entry value"); } try { assertTrue(e.getValue().remove(3)); assertFalse(e.getValue().contains(3)); assertFalse(e.getValue().remove(3)); } catch(UnsupportedOperationException ex) { fail("unable to remove from entry value"); } try { if(!e.getValue().isEmpty()) { e.getValue().remove(e.getValue().iterator().next()); } } catch(UnsupportedOperationException ex) { fail("unable to call remove() for entry value"); } try { if(!e.getValue().isEmpty()) { Iterator it = e.getValue().iterator(); it.next(); it.remove(); } } catch(UnsupportedOperationException ex) { fail("unable to call remove() for entry value iterator"); } try { e.setValue(new HashSet(Collections.singleton(0))); } catch(UnsupportedOperationException ex) { fail("unable to set entry value"); } } } } @Test public void testMapValues() { Set> as = new HashSet>(); as.add(Collections.singleton(2)); as.add(Collections.singleton(3)); as.add(Collections.singleton(4)); Set s = new HashSet(twoAVals); as.add(s); Map> amap = alignment.asMap(A), bmap = alignment.asMap(B); assertTrue(amap.values().size() == as.size() && amap.values().containsAll(as)); Set> bvals = new HashSet>(); // avoid doubling bvals.addAll(bmap.values()); as.remove(s); as.add(Collections.singleton(0)); as.add(Collections.singleton(1)); as.remove(Collections.singleton(4)); assertEquals(as, bvals); assertTrue(bmap.values().contains(Collections.singleton(2))); try { amap.values().add(Collections.singleton(1)); fail("able to add value"); } catch(UnsupportedOperationException expected) { // do nothing } try { if(!amap.values().isEmpty()) { amap.values().remove(amap.values().iterator().next()); } } catch(UnsupportedOperationException ex) { fail("unable to remove value"); } } @Test public void testMapKeySet() { Map> amap = alignment.asMap(A), bmap = alignment.asMap(B); assertTrue(amap.keySet().contains(1)); assertTrue(bmap.keySet().contains(3)); assertFalse(amap.keySet().contains(4)); assertFalse(amap.keySet().contains(null)); assertFalse(bmap.keySet().contains(5)); try { amap.keySet().add(4); fail("able to add key to key set"); } catch(UnsupportedOperationException expected) { // do nothing, expected } try { bmap.keySet().add(4); fail("able to add key to key set"); } catch(UnsupportedOperationException expected) { // do nothing, expected } try { amap.keySet().remove(1); assertFalse(amap.keySet().contains(1)); } catch(UnsupportedOperationException ex) { fail("unable to remove key from key set"); } try { bmap.keySet().remove(3); assertFalse(bmap.keySet().contains(3)); } catch(UnsupportedOperationException ex) { fail("unable to remove key from key set"); } try { amap.keySet().clear(); assertTrue(amap.keySet().isEmpty()); } catch(UnsupportedOperationException expected) { fail("unable to clear key set"); } try { bmap.keySet().clear(); assertTrue(bmap.keySet().isEmpty()); } catch(UnsupportedOperationException expected) { fail("able to clear key set"); } try{ amap.keySet().add(5); fail("able to add to key set"); } catch(UnsupportedOperationException ex) { // expected } } 
@Test public void testMapContains() { Map> amap = alignment.asMap(A), bmap = alignment.asMap(B); for(int i = 0; i < 4; i++) { assertTrue(amap.containsKey(i)); assertTrue(bmap.containsKey(i)); } assertTrue(bmap.containsKey(4)); assertFalse(amap.containsKey(4)); assertTrue(bmap.containsValue(Collections.singleton(2))); Set s = new HashSet(twoAVals); assertTrue(amap.containsValue(s)); } @Test public void testMapGet() { Map> amap = alignment.asMap(A), bmap = alignment.asMap(B); Set s = new HashSet(twoAVals); assertEquals(s, amap.get(2)); assertEquals(Collections.singleton(3), bmap.get(4)); assertNull(amap.get(4)); try { assertTrue(amap.get(2).contains(1)); amap.get(2).remove(1); assertFalse(amap.get(2).contains(1)); } catch(UnsupportedOperationException expected) { fail("unable remove from value set"); } try { assertFalse(bmap.get(4).contains(2)); bmap.get(4).add(2); assertTrue(bmap.get(4).contains(2)); } catch(UnsupportedOperationException expected) { fail("unable add to value set"); } } @Test public void testMapPut() { Map> amap = alignment.asMap(A), bmap = alignment.asMap(B); try { assertEquals(Collections.singleton(3), amap.put(1, Collections.singleton(2))); assertEquals(Collections.singleton(2), amap.get(1)); } catch(UnsupportedOperationException expected) { fail("unable to put"); } try { assertEquals(Collections.singleton(0), bmap.put(2, Collections.singleton(3))); assertEquals(Collections.singleton(3), bmap.get(2)); } catch(UnsupportedOperationException expected) { fail("unable to put"); } amap.remove(1); assertNull(amap.put(1, Collections.singleton(0))); } @Test public void testMapRemove() { Map> amap = alignment.asMap(A), bmap = alignment.asMap(B); try { assertTrue(amap.containsKey(1)); amap.remove(1); assertFalse(amap.containsKey(1)); } catch(UnsupportedOperationException expected) { fail("unable to remove"); } try { assertTrue(bmap.containsKey(2)); bmap.remove(2); assertFalse(bmap.containsKey(2)); } catch(UnsupportedOperationException expected) { fail("unable to remove"); } } @Test public void testMapAdd() { Map> amap = alignment.asMap(A), bmap = alignment.asMap(B); try { amap.get(1).add(0); assertTrue(amap.get(1).contains(0)); } catch(UnsupportedOperationException expected) { fail("unable to add"); } try { bmap.get(2).add(3); assertTrue(bmap.get(2).contains(3)); } catch(UnsupportedOperationException expected) { fail("unable to add"); } } @Test public void testMapClear() { Map> amap = alignment.asMap(A), bmap = alignment.asMap(B); try { amap.clear(); assertTrue(amap.isEmpty()); } catch(UnsupportedOperationException expected) { fail("unable to clear"); } try { bmap.clear(); assertTrue(bmap.isEmpty()); } catch(UnsupportedOperationException expected) { fail("unable to clear"); } } @Test public void testAsMap() { Map> amap = alignment.asMap(A), bmap = alignment.asMap(B); assertEquals(map, amap); assertEquals(pam, bmap); assertTrue(map.keySet().containsAll(amap.keySet())); assertTrue(pam.keySet().containsAll(bmap.keySet())); assertTrue(map.values().containsAll(amap.values())); assertTrue(pam.values().containsAll(bmap.values())); assertEquals(4, amap.size()); assertEquals(5, bmap.size()); assertFalse(amap.isEmpty()); assertFalse(bmap.isEmpty()); alignment.add(new Mapping(id, 2, 2)); assertTrue(alignment.asMap(A).get(2).contains(2)); } @Test public void testFromMap() { assertEquals(alignment, Alignment.fromMap(one, two, map)); assertEquals(alignment.reverse(), Alignment.fromMap(two, one, pam)); assertEquals(alignment, Alignment.fromMap(one, two, alignment.asMap(A))); 
assertEquals(alignment.reverse(), Alignment.fromMap(two, one, alignment.asMap(B))); } @Test public void testReverse() { for(PhrasePosition pos : PhrasePosition.values()) { assertEquals(alignment.get(pos), alignment.reverse().get(pos.opposite())); } for(Mapping r : alignment.reverse()) { assertTrue(alignment.contains(r.reverse())); } assertEquals(alignment, alignment.reverse().reverse()); } @Test public void testGetIndices() { Set is = new HashSet(); for(int i = 0; i < 4; i++) { is.add(i); } assertEquals(is, alignment.getIndices(A)); is.add(4); assertEquals(is, alignment.getIndices(B)); } } ================================================ FILE: test/opennlp/ccg/alignment/IdentifiedPhraseReaderWriterTest.java ================================================ package opennlp.ccg.alignment; import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertNull; import static org.junit.Assert.fail; import java.io.IOException; import java.io.StringReader; import java.io.StringWriter; import java.util.ArrayList; import java.util.Iterator; import java.util.List; import org.junit.Before; import org.junit.Test; public class IdentifiedPhraseReaderWriterTest { String lineSep = System.getProperty("line.separator"); String input = "First phrase.\n Second phrase\r\n Third phrase . ", output = "First phrase." + lineSep + "Second phrase" + lineSep + "Third phrase ." + lineSep, paddedOutput = " First phrase. " + lineSep + " Second phrase " + lineSep + " Third phrase . " + lineSep; List phrases; @Before public void setUp() throws Exception { phrases = new ArrayList(); phrases.add(new Phrase("157", 0, Alignments.tokenize("First phrase."))); phrases.add(new Phrase("387b", 1, Alignments.tokenize("Second phrase"))); phrases.add(new Phrase("55", 2, Alignments.tokenize("Third phrase ."))); } @Test public void testIdentifiedPhraseReader() { try { new IdentifiedPhraseReader(new StringReader(""), null); fail("able to specify null number base"); } catch(IllegalArgumentException expected) { // do nothing } try { new IdentifiedPhraseReader(new StringReader(""), IndexBase.ZERO, null, ""); fail("able to specify null string"); } catch(IllegalArgumentException expected) { // do nothing } try { new IdentifiedPhraseReader(new StringReader(""), IndexBase.ZERO, "", null); fail("able to specify null string"); } catch(IllegalArgumentException expected) { // do nothing } } @Test public void testBoth() { StringWriter sw = new StringWriter(); IdentifiedPhraseWriter writer = new IdentifiedPhraseWriter(sw); try { for(Phrase p : phrases) { writer.writePhrase(p); } } catch(IOException io) { fail(io.getMessage()); } IdentifiedPhraseReader reader = new IdentifiedPhraseReader(new StringReader(sw.getBuffer().toString())); Iterator i = phrases.iterator(); try { Phrase p; while((p = reader.readPhrase()) != null) { assertEquals(i.next(), p); } } catch(IOException io) { fail(io.getMessage()); } } @Test public void testReadPhrase() { IdentifiedPhraseReader reader = new IdentifiedPhraseReader(new StringReader(input)); try { Iterator i = phrases.iterator(); Phrase p; while((p = reader.readPhrase()) != null) { assertEquals(i.next(), p); } reader = new IdentifiedPhraseReader(new StringReader("")); assertNull(reader.readPhrase()); reader.close(); } catch(IOException io) { fail(io.getMessage()); } } @Test public void testWritePhrase() { StringWriter sw = new StringWriter(); IdentifiedPhraseWriter writer = new IdentifiedPhraseWriter(sw); try { for(Phrase p : phrases) { writer.writePhrase(p); } assertEquals(output, 
sw.getBuffer().toString()); writer.close(); } catch(IOException io) { fail(io.getMessage()); } // test padded version sw = new StringWriter(); writer = new IdentifiedPhraseWriter(sw, writer.getWordSeparator(), writer.getPhraseTag(), writer.getPhraseIdentifierAttribute(), true); try { for(Phrase p : phrases) { writer.writePhrase(p); } assertEquals(paddedOutput, sw.getBuffer().toString()); writer.close(); } catch(IOException io) { fail(io.getMessage()); } } } ================================================ FILE: test/opennlp/ccg/alignment/IndexBaseTest.java ================================================ package opennlp.ccg.alignment; import static opennlp.ccg.alignment.IndexBase.ONE; import static opennlp.ccg.alignment.IndexBase.ZERO; import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertFalse; import static org.junit.Assert.assertTrue; import static org.junit.Assert.fail; import org.junit.Test; public class IndexBaseTest { Integer zero = new Integer(0), one = new Integer(1), two = new Integer(2), negOne = new Integer(-1), negTwo = new Integer(-2); @Test public void testGetStart() { assertEquals(zero, ZERO.start); assertEquals(one, ONE.start); } @Test public void testGetNullValue() { assertEquals(negOne, ZERO.nullValue); assertEquals(zero, ONE.nullValue); } @Test public void testIsValidIndex() { assertTrue(ZERO.isValidIndex(zero)); assertTrue(ZERO.isValidIndex(one)); assertTrue(ZERO.isValidIndex(negOne)); assertFalse(ZERO.isValidIndex(negTwo)); assertTrue(ONE.isValidIndex(zero)); assertTrue(ONE.isValidIndex(one)); assertFalse(ONE.isValidIndex(negOne)); assertFalse(ONE.isValidIndex(negTwo)); assertTrue(ZERO.isValidIndex(two)); assertTrue(ONE.isValidIndex(two)); } @Test public void testTranslate() { try { ZERO.translate(negTwo, ONE); fail("ZERO able to translate " + negTwo); } catch(IllegalArgumentException expected) { // do nothing } try { ONE.translate(negOne, ZERO); fail("ONE able to translate " + negOne); } catch(IllegalArgumentException expected) { // do nothing } // identity tests assertEquals(one, ZERO.translate(one, ZERO)); assertEquals(one, ONE.translate(one, ONE)); assertEquals(zero, ZERO.translate(zero, ZERO)); assertEquals(zero, ONE.translate(zero, ONE)); // actual translations assertEquals(zero, ZERO.translate(negOne, ONE)); assertEquals(one, ZERO.translate(zero, ONE)); assertEquals(two, ZERO.translate(one, ONE)); assertEquals(negOne, ONE.translate(zero, ZERO)); assertEquals(zero, ONE.translate(one, ZERO)); assertEquals(one, ONE.translate(two, ZERO)); } } ================================================ FILE: test/opennlp/ccg/alignment/MappingFormatTest.java ================================================ package opennlp.ccg.alignment; import static org.junit.Assert.*; import java.text.ParseException; import java.util.HashSet; import java.util.Set; import opennlp.ccg.alignment.MappingFormat.Field; import org.junit.Before; import org.junit.Test; import static opennlp.ccg.alignment.Alignments.*; public class MappingFormatTest { Set formats; Mapping vanilla, chocolate, nullId, nullValue; @Before public void setUp() throws Exception { MappingFormat moses = MappingFormat.getInstance(MOSES_ENCODING_SCHEME), mosesShort = MappingFormat.getInstance(MOSES_ENCODING_SCHEME, Alignments.MOSES_SHORT_FIELDS), mosesShortStrict = MappingFormat.getInstance(MOSES_ENCODING_SCHEME, Alignments.MOSES_SHORT_FIELDS, true), naacl = MappingFormat.getInstance(NAACL_ENCODING_SCHEME), naaclShort = MappingFormat.getInstance(NAACL_ENCODING_SCHEME, Alignments.NAACL_SHORT_FIELDS), 
naaclShortStrict = MappingFormat.getInstance(NAACL_ENCODING_SCHEME, Alignments.NAACL_SHORT_FIELDS, true), naaclVeryShort = MappingFormat.getInstance(NAACL_ENCODING_SCHEME, Alignments.NAACL_VERY_SHORT_FIELDS); formats = new HashSet(); formats.add(moses); formats.add(mosesShort); formats.add(mosesShortStrict); formats.add(naacl); formats.add(naaclShort); formats.add(naaclShortStrict); formats.add(naaclVeryShort); vanilla = new Mapping(31, 4, 9); chocolate = new Mapping(31, 13, 5, Status.POSSIBLE, 0.75); nullId = new Mapping(null, 2, 2); nullValue = new Mapping(17, -1, 5); } @Test public void testMappingFormat() { Set fields = new HashSet(); fields.add(Field.PHRASE_NUMBER_FIELD); try { MappingFormat.getInstance(MOSES_ENCODING_SCHEME, fields, true); fail("able to create Moses formatter with ID field"); } catch(IllegalArgumentException expected) { // should happen } try { MappingFormat.getInstance(NAACL_ENCODING_SCHEME, fields, false); fail("able to create NAACL formatter with only ID field"); } catch(IllegalArgumentException expected) { // should happen } try { MappingFormat.getInstance(MOSES_ENCODING_SCHEME, null, true); fail("able to create Moses formatter with null fields"); } catch(IllegalArgumentException expected) { // should happen } try { MappingFormat.getInstance(NAACL_ENCODING_SCHEME, null, false); fail("able to create NAACL formatter with null fields"); } catch(IllegalArgumentException expected) { // should happen } try { MappingFormat.getInstance(null, fields, true); fail("able to create formatter null scheme"); } catch(IllegalArgumentException expected) { // should happen } } @Test public void testFormatMapping() { for(MappingFormat mf : formats) { String v = mf.format(vanilla), c = mf.format(chocolate), ni = null; EncodingScheme es = mf.encodingScheme; try { ni = mf.formatMapping(nullId); } catch(IllegalArgumentException e) { if(!es.getRequired().contains(MappingFormat.Field.PHRASE_NUMBER_FIELD)) { fail("unexpected exception: " + e.getMessage()); } } try { mf.format(nullValue); fail("able to format mapping with null index"); } catch(IllegalArgumentException expected) { // should happen } if(es.equals(MOSES_ENCODING_SCHEME)) { if(mf.fields.contains(MappingFormat.Field.STATUS_FIELD)) { assertEquals("13-5-P", c); if(mf.isStrict()) { assertEquals("4-9-S", v); assertEquals("2-2-S", ni); } else { assertEquals("4-9", v); assertEquals("2-2", ni); } } else { assertEquals("4-9", v); assertEquals("13-5", c); assertEquals("2-2", ni); } } else if(es.equals(NAACL_ENCODING_SCHEME)) { try { ni = mf.formatMapping(nullId); fail("able to format mapping with null id"); } catch(IllegalArgumentException expected) { // should happen } if(mf.fields.contains(MappingFormat.Field.STATUS_FIELD)) { if(mf.fields.contains(MappingFormat.Field.CONFIDENCE_FIELD)) { if(mf.isStrict()) { assertEquals("31 5 10 S 1.0", v); assertEquals("31 14 6 P 0.75", c); } else { assertEquals("31 5 10", v); assertEquals("31 14 6 P 0.75", c); } } else { assertEquals("31 14 6 P", c); if(mf.isStrict()) { assertEquals("31 5 10 S", v); } else { assertEquals("31 5 10", v); } } } else { assertEquals("31 5 10", v); assertEquals("31 14 6", c); } } } } @Test public void testParseMapping() { for(MappingFormat mf : formats) { EncodingScheme es = mf.encodingScheme; Mapping v, c, ni; if(es.equals(MOSES_ENCODING_SCHEME)) { try { mf.parseMapping("-1-5"); fail("able to parse mapping with negative index"); } catch(ParseException expected) { // should } if(mf.fields.contains(MappingFormat.Field.STATUS_FIELD)) { try { v = 
mf.parseMapping("4-9-S").copyWithPhraseNumber(chocolate.phraseNumber); assertEquals(vanilla, v); c = mf.parseMapping("13-5-P").copyWithPhraseNumber(chocolate.phraseNumber); c.setConfidence(chocolate.confidence); assertEquals(chocolate, c); ni = mf.parseMapping("2-2-S"); assertEquals(nullId, ni); if(mf.isStrict()) { try { mf.parseMapping("4-9"); fail("strict format able to parse loose input"); } catch(ParseException expected) { assertEquals(3, expected.getErrorOffset()); } } else { v = mf.parseMapping("4-9").copyWithPhraseNumber(chocolate.phraseNumber); assertEquals(vanilla, v); ni = mf.parseMapping("2-2"); assertEquals(nullId, ni); } } catch(ParseException p) { fail("parse exception: " + p.getMessage()); } } else { try { v = mf.parseMapping("4-9").copyWithPhraseNumber(chocolate.phraseNumber); assertEquals(vanilla, v); c = mf.parseMapping("13-5").copyWithPhraseNumber(chocolate.phraseNumber); c.setStatus(Status.POSSIBLE); c.setConfidence(chocolate.confidence); assertEquals(chocolate, c); ni = mf.parseMapping("2-2"); assertEquals(nullId, ni); } catch(ParseException p) { fail("parse exception: " + p.getMessage()); } } } else if(es.equals(NAACL_ENCODING_SCHEME)) { try { mf.parseMapping("31 0 6 S 1.0"); fail("able to parse mapping with 0 index, but index base is 1"); } catch(ParseException expected) { // should } if(mf.fields.contains(MappingFormat.Field.STATUS_FIELD)) { if(mf.fields.contains(MappingFormat.Field.CONFIDENCE_FIELD)) { try { if(mf.isStrict()) { v = mf.parseMapping("31 5 10 S 1.0"); assertEquals(vanilla, v); try { mf.parseMapping("31 5 10"); fail("able to parse loose input with strict format"); } catch(ParseException expected) { assertEquals(7, expected.getErrorOffset()); } } else { v = mf.parseMapping("31 5 10"); assertEquals(vanilla, v); } c = mf.parseMapping("31 14 6 P 0.75"); assertEquals(chocolate, c); try { ni = mf.parseMapping("3 3 S"); } catch(ParseException should) { // expected assertEquals(4, should.getErrorOffset()); } } catch(ParseException p) { fail("parse exception: " + p.getMessage()); } } else { try { if(mf.isStrict()) { v = mf.parseMapping("31 5 10 S"); assertEquals(vanilla, v); try { mf.parseMapping("31 5 10"); fail("able to parse loose input with strict format"); } catch(ParseException expected) { assertEquals(7, expected.getErrorOffset()); } } else { v = mf.parseMapping("31 5 10"); assertEquals(vanilla, v); } c = mf.parseMapping("31 14 6 P"); c.setConfidence(chocolate.confidence); assertEquals(chocolate, c); try { ni = mf.parseMapping("3 3 S"); } catch(ParseException should) { // expected assertEquals(4, should.getErrorOffset()); } } catch(ParseException p) { fail("parse exception: " + p.getMessage()); } } } else { try { v = mf.parseMapping("31 5 10"); assertEquals(vanilla, v); c = mf.parseMapping("31 14 6"); c.setStatus(Status.POSSIBLE); c.setConfidence(chocolate.confidence); assertEquals(chocolate, c); try { ni = mf.parseMapping("3 3 S"); fail("able to parse mapping without ID"); } catch(ParseException should) { // expected assertEquals(4, should.getErrorOffset()); } } catch(ParseException p) { fail("parse exception: " + p.getMessage()); } } } } } } ================================================ FILE: test/opennlp/ccg/alignment/MappingGroupTest.java ================================================ package opennlp.ccg.alignment; import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertNotSame; import static org.junit.Assert.fail; import org.junit.Before; import org.junit.Test; public class MappingGroupTest { MappingGroup one, two; 
@Before public void setUp() throws Exception { one = new MappingGroup(37, 12); two = new MappingGroup(1, 8); } @Test public void testMappingGroup() { try { new MappingGroup(null, 1); fail("able to specify null number"); } catch(IllegalArgumentException expected) { // do nothing } try { new MappingGroup(37, -1); fail("able to specify negative length"); } catch(IllegalArgumentException expected) { // do nothing } } @Test public void testEqualsObject() { assertNotSame(one, two); assertNotSame(two, null); assertEquals(one, new MappingGroup(one.phraseNumber, one.length)); } @Test public void testCompareTo() { assertEquals(0, one.compareTo(one)); assertEquals(1, one.compareTo(two)); } } ================================================ FILE: test/opennlp/ccg/alignment/MappingReaderWriterTest.java ================================================ package opennlp.ccg.alignment; import static opennlp.ccg.alignment.Status.POSSIBLE; import static opennlp.ccg.alignment.Status.SURE; import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertFalse; import static org.junit.Assert.assertNull; import static org.junit.Assert.fail; import java.io.IOException; import java.io.StringReader; import java.io.StringWriter; import java.util.Iterator; import java.util.LinkedHashSet; import java.util.Set; import org.junit.Before; import org.junit.Test; import static opennlp.ccg.alignment.Alignments.*; public class MappingReaderWriterTest { MappingReader mosesReader, naaclReader; MappingWriter mosesWriter, naaclWriter; StringWriter mosesStringWriter, naaclStringWriter; MappingFormat mosesFormat = MappingFormat.getInstance(MOSES_ENCODING_SCHEME), naaclFormat = MappingFormat.getInstance(NAACL_ENCODING_SCHEME, Alignments.NAACL_SHORT_FIELDS, false); Set mosesMappings = new LinkedHashSet(), naaclMappings = new LinkedHashSet(); Set mosesGroups = new LinkedHashSet(), naaclGroups = new LinkedHashSet(); String lineSep = System.getProperty("line.separator"); String mosesInput = "0-1-S 0-0 2-1-P 3-3 4-8 21-23\r\n3-4 34-55-P 1-4 23-1-S\n", mosesOutput = "0-1 0-0 2-1-P 3-3 4-8 21-23" + lineSep + "3-4 34-55-P 1-4 23-1", naaclInput = "17 1 1 S\r17 2 3 P\n17 5 5\r\n17 4 4 S 0.75\n37 3 2 P", naaclOutput = "17 1 1" + lineSep + "17 2 3 P" + lineSep + "17 5 5" + lineSep + "17 4 4" + lineSep + "37 3 2 P", emptyInput = "", lineEndingOnly = "\n"; @Before public void setUp() throws Exception { mosesReader = new MappingReader(new StringReader(mosesInput), mosesFormat); naaclReader = new MappingReader(new StringReader(naaclInput), naaclFormat); mosesStringWriter = new StringWriter(); mosesWriter = new MappingWriter(mosesStringWriter, mosesFormat); naaclStringWriter = new StringWriter(); naaclWriter = new MappingWriter(naaclStringWriter, naaclFormat); mosesMappings.add(new Mapping(0, 0, 1, SURE)); mosesMappings.add(new Mapping(0, 0, 0)); mosesMappings.add(new Mapping(0, 2, 1, POSSIBLE)); mosesMappings.add(new Mapping(0, 3, 3)); mosesMappings.add(new Mapping(0, 4, 8)); mosesMappings.add(new Mapping(0, 21, 23)); mosesMappings.add(new Mapping(1, 3, 4)); mosesMappings.add(new Mapping(1, 34, 55, POSSIBLE)); mosesMappings.add(new Mapping(1, 1, 4)); mosesMappings.add(new Mapping(1, 23, 1, SURE)); naaclMappings.add(new Mapping(17, 0, 0, SURE)); naaclMappings.add(new Mapping(17, 1, 2, POSSIBLE)); naaclMappings.add(new Mapping(17, 4, 4)); naaclMappings.add(new Mapping(17, 3, 3, SURE, new Double(0.75d))); naaclMappings.add(new Mapping(37, 2, 1, POSSIBLE)); mosesGroups.add(new MappingGroup(0, 6)); mosesGroups.add(new MappingGroup(1, 
4)); naaclGroups.add(new MappingGroup(17, 4)); naaclGroups.add(new MappingGroup(37, 1)); } @Test public void testConstructors() { try { new MappingReader(new StringReader(""), null); fail("able to specify null format"); } catch(IllegalArgumentException expected) { // do nothing } try { new MappingWriter(new StringWriter(), null); fail("able to specify null format"); } catch(IllegalArgumentException expected) { // do nothing } } @Test public void testBoth() { Iterator mi = mosesMappings.iterator(); Iterator gi = mosesGroups.iterator(); StringWriter sw = new StringWriter(); MappingWriter mw = new MappingWriter(sw, mosesFormat); try { while(gi.hasNext()) { mw.startGroup(gi.next()); while(mw.canWrite() && mi.hasNext()) { mw.writeMapping(mi.next()); } } gi = mosesGroups.iterator(); mi = mosesMappings.iterator(); MappingReader mr = new MappingReader(new StringReader(sw.getBuffer().toString()), mosesFormat); while(gi.hasNext()) { MappingGroup g = gi.next(); assertEquals(g, mr.nextGroup()); while(mr.canRead()) { assertEquals(mi.next(), mr.readMapping()); } } mi = naaclMappings.iterator(); gi = naaclGroups.iterator(); sw = new StringWriter(); mw.close(); mw = new MappingWriter(sw, naaclFormat); while(gi.hasNext()) { mw.startGroup(gi.next()); while(mw.canWrite() && mi.hasNext()) { mw.writeMapping(mi.next()); } } mi = naaclMappings.iterator(); gi = naaclGroups.iterator(); mr.close(); mr = new MappingReader(new StringReader(sw.getBuffer().toString()), naaclFormat); while(gi.hasNext()) { MappingGroup g = gi.next(); assertEquals(g, mr.nextGroup()); while(mr.canRead()) { Mapping m = mi.next(); m.setConfidence(Alignments.DEFAULT_CONFIDENCE); assertEquals(m, mr.readMapping()); } } mosesWriter.close(); naaclWriter.close(); mr.close(); mw.close(); } catch(IOException io) { fail(io.getMessage()); } } @Test public void testMappingWriter() { Iterator mi = mosesMappings.iterator(); Iterator gi = mosesGroups.iterator(); try { while(gi.hasNext()) { mosesWriter.startGroup(gi.next()); while(mosesWriter.canWrite()) { mosesWriter.writeMapping(mi.next()); } } mosesWriter.close(); assertEquals(mosesOutput, mosesStringWriter.getBuffer().toString()); mi = naaclMappings.iterator(); gi = naaclGroups.iterator(); while(gi.hasNext()) { naaclWriter.startGroup(gi.next()); while(naaclWriter.canWrite()) { naaclWriter.writeMapping(mi.next()); } } naaclWriter.close(); assertEquals(naaclOutput, naaclStringWriter.getBuffer().toString()); } catch(IOException io) { fail(io.getMessage()); } MappingWriter mw = new MappingWriter(new StringWriter(), naaclFormat); try { mw.writeMapping(new Mapping(1, 0)); fail("able to write mapping without starting group"); } catch(IOException expected) { //should happen } mw = new MappingWriter(new StringWriter(), mosesFormat); try { mw.startGroup(new MappingGroup(0, 1)); try { mw.writeMapping(new Mapping(1, 1, 1)); fail("able to write mapping from different group"); } catch(IOException expected) { //should happen } } catch(IOException io) { fail("problem testing: " + io.getMessage()); } mw = new MappingWriter(new StringWriter(), naaclFormat); try { mw.startGroup(new MappingGroup(0, 1)); mw.writeMapping(new Mapping(0, 1, 1)); try { mw.writeMapping(new Mapping(0, 1, 2)); fail("able to write too many mappings"); } catch(IOException expected) { //should happen } } catch(IOException io) { fail("problem testing: " + io.getMessage()); } mw = new MappingWriter(new StringWriter(), mosesFormat); try { mw.startGroup(new MappingGroup(0, 2)); mw.writeMapping(new Mapping(0, 1, 1)); try { mw.close(); fail("able to write 
too few mappings"); } catch(IOException expected) { //should happen } } catch(IOException io) { fail("problem testing: " + io.getMessage()); } StringWriter sw = new StringWriter(); mw = new MappingWriter(sw, naaclFormat); try { mw.startGroup(new MappingGroup(0, 0)); mw.endGroup(); mw.close(); assertEquals("", sw.getBuffer().toString()); } catch(IOException io) { fail("problem testing: " + io.getMessage()); } } @Test public void testMappingReader() { Iterator mi = mosesMappings.iterator(); Iterator gi = mosesGroups.iterator(); try { MappingGroup g; while((g = mosesReader.nextGroup()) != null) { assertEquals(gi.next(), g); while(mosesReader.canRead()) { assertEquals(mi.next(), mosesReader.readMapping()); } } mosesReader.close(); mi = naaclMappings.iterator(); gi = naaclGroups.iterator(); while((g = naaclReader.nextGroup()) != null) { assertEquals(gi.next(), g); while(naaclReader.canRead()) { assertEquals(mi.next(), naaclReader.readMapping()); } } naaclReader.close(); mosesReader = new MappingReader(new StringReader(emptyInput), mosesFormat); naaclReader = new MappingReader(new StringReader(emptyInput), naaclFormat); try { assertFalse(mosesReader.ready()); assertFalse(mosesReader.canRead()); assertNull(mosesReader.nextGroup()); } catch(IOException io) { fail("problem testing: " + io.getMessage()); } try { assertFalse(naaclReader.ready()); assertFalse(naaclReader.canRead()); assertNull(naaclReader.nextGroup()); } catch(IOException expected) { // should happen } mosesReader = new MappingReader(new StringReader(lineEndingOnly), mosesFormat); naaclReader = new MappingReader(new StringReader(lineEndingOnly), naaclFormat); try { assertFalse(mosesReader.ready()); assertFalse(mosesReader.canRead()); assertNull(mosesReader.nextGroup()); } catch(IOException io) { fail("problem testing: " + io.getMessage()); } try { assertFalse(naaclReader.ready()); assertFalse(naaclReader.canRead()); assertNull(naaclReader.nextGroup()); } catch(IOException io) { fail("problem testing: " + io.getMessage()); } mosesReader = new MappingReader(new StringReader("5-4-"), mosesFormat); naaclReader = new MappingReader(new StringReader("0 S\n"), naaclFormat); try { mosesReader.nextGroup(); fail("able to get next group from garbage input"); } catch(IOException expected) { // should happen } try { naaclReader.nextGroup(); fail("able to get next group from garbage input"); } catch(IOException expected) { // should happen } mosesReader = new MappingReader(new StringReader(mosesInput), mosesFormat); naaclReader = new MappingReader(new StringReader(naaclInput), naaclFormat); try { mosesReader.readMapping(); fail("able to read mapping without group"); } catch(IOException expected) { // should happen } try { naaclReader.readMapping(); fail("able to read mapping without group"); } catch(IOException expected) { // should happen } mosesReader = new MappingReader(new StringReader(mosesInput), mosesFormat); naaclReader = new MappingReader(new StringReader(naaclInput), naaclFormat); MappingGroup mg = mosesReader.nextGroup(); for(int i = 0; i < mg.length - 1; i++) { mosesReader.readMapping(); } try { mosesReader.close(); fail("able to read too few mappings"); } catch(IOException expected) { // should happen } mg = naaclReader.nextGroup(); for(int i = 0; i < mg.length - 1; i++) { naaclReader.readMapping(); } try { naaclReader.close(); fail("able to read too few mappings"); } catch(IOException expected) { // should happen } } catch(IOException io) { fail(io.getMessage()); } } } ================================================ FILE: 
test/opennlp/ccg/alignment/MappingTest.java ================================================ package opennlp.ccg.alignment; import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertNotSame; import static org.junit.Assert.fail; import org.junit.Before; import org.junit.Test; public class MappingTest { Integer id, first, second; Mapping mapping; @Before public void setUp() throws Exception { id = new Integer(37); first = new Integer(4); second = new Integer(7); mapping = new Mapping(id, first, second); } @Test public void testMapping() { try { new Mapping(null, 3); fail("able to specify null index"); } catch(IllegalArgumentException expected) { // do nothing } try { new Mapping(3, null); fail("able to specify null index"); } catch(IllegalArgumentException expected) { // do nothing } try { new Mapping(1, 2, 3, null); fail("able to specify null status"); } catch(IllegalArgumentException expected) { // do nothing } try { new Mapping(1, 2, 3, Status.SURE, null); fail("able to specify null confidence"); } catch(IllegalArgumentException expected) { // do nothing } } @Test public void testGet() { assertEquals(id, mapping.getPhraseNumber()); assertEquals(first, mapping.getA()); assertEquals(first, mapping.get(PhrasePosition.A)); assertEquals(second, mapping.getB()); assertEquals(second, mapping.get(PhrasePosition.B)); } @Test public void testCompareTo() { Mapping m = new Mapping(id, first, second), n = new Mapping(id, first - 1, second + 1), o = new Mapping(id, first, second - 1), p = new Mapping(id, first + 1, second); assertEquals(0, mapping.compareTo(m)); assertEquals(0, m.compareTo(mapping)); assertEquals(1, mapping.compareTo(n)); assertEquals(-1, n.compareTo(mapping)); assertEquals(1, mapping.compareTo(o)); assertEquals(-1, o.compareTo(mapping)); assertEquals(-1, mapping.compareTo(p)); assertEquals(1, p.compareTo(mapping)); } @Test public void testEqualsObject() { Mapping m = new Mapping(id, first, second), n = new Mapping(id, first - 1, second + 1), o = new Mapping(id, first, second - 1), p = new Mapping(id, first + 1, second); assertEquals(mapping, m); assertNotSame(mapping, n); assertNotSame(mapping, o); assertNotSame(mapping, p); } @Test public void testReverse() { assertEquals(new Mapping(id, second, first), mapping.reverse()); } @Test public void testSet() { assertEquals(Alignments.DEFAULT_STATUS, mapping.getStatus()); mapping.setStatus(Status.POSSIBLE); assertEquals(Status.POSSIBLE, mapping.getStatus()); assertEquals(Alignments.DEFAULT_CONFIDENCE, mapping.getConfidence()); mapping.setConfidence(0.5); assertEquals(Double.valueOf(0.5d), mapping.getConfidence()); } @Test public void testHashCode() { int hash = mapping.hashCode(); mapping.setStatus(Status.POSSIBLE); assertEquals(hash, mapping.hashCode()); mapping.setConfidence(0.5); assertEquals(hash, mapping.hashCode()); } } ================================================ FILE: test/opennlp/ccg/alignment/PhraseReaderWriterTest.java ================================================ package opennlp.ccg.alignment; import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertNull; import static org.junit.Assert.fail; import java.io.IOException; import java.io.StringReader; import java.io.StringWriter; import java.util.ArrayList; import java.util.Iterator; import java.util.List; import org.junit.Before; import org.junit.Test; public class PhraseReaderWriterTest { String lineSep = System.getProperty("line.separator"); String input = "Phrase one.\nPhrase two\r\nPhrase three .", output = "Phrase one." 
+ lineSep + "Phrase two" + lineSep + "Phrase three ." + lineSep; PhraseReader reader; PhraseWriter writer; List phrases; @Before public void setUp() throws Exception { phrases = new ArrayList(); phrases.add(new Phrase(0, Alignments.tokenize("Phrase one."))); phrases.add(new Phrase(1, Alignments.tokenize("Phrase two"))); phrases.add(new Phrase(2, Alignments.tokenize("Phrase three ."))); } @Test public void testConstructors() { try { new PhraseReader(new StringReader(""), null); fail("able to specify null number base"); } catch(IllegalArgumentException expected) { // do nothing } try { new PhraseWriter(new StringWriter(), null); fail("able to specify null number base"); } catch(IllegalArgumentException expected) { // do nothing } } @Test public void testBoth() { StringWriter sw = new StringWriter(); writer = new PhraseWriter(sw); try { for(Phrase p : phrases) { writer.writePhrase(p); } } catch(IOException io) { fail(io.getMessage()); } reader = new PhraseReader(new StringReader(sw.getBuffer().toString())); Iterator i = phrases.iterator(); try { Phrase p; while((p = reader.readPhrase()) != null) { assertEquals(i.next(), p); } } catch(IOException io) { fail(io.getMessage()); } } @Test public void testReadPhrase() { reader = new PhraseReader(new StringReader(input)); try { Iterator i = phrases.iterator(); Phrase p; while((p = reader.readPhrase()) != null) { assertEquals(i.next(), p); } reader = new PhraseReader(new StringReader(""), reader.getNumberBase()); assertNull(reader.readPhrase()); } catch(IOException io) { fail(io.getMessage()); } } @Test public void testWritePhrase() { StringWriter sw = new StringWriter(); writer = new PhraseWriter(sw); try { for(Phrase p : phrases) { writer.writePhrase(p); } assertEquals(output, sw.getBuffer().toString()); } catch(IOException io) { fail(io.getMessage()); } } } ================================================ FILE: test/opennlp/ccg/alignment/PhraseTest.java ================================================ package opennlp.ccg.alignment; import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertNotSame; import static org.junit.Assert.fail; import java.util.ArrayList; import java.util.Iterator; import java.util.List; import org.junit.Before; import org.junit.Test; public class PhraseTest { Phrase phrase; String[] wordList = Alignments.tokenize("This is a test ."); @Before public void setUp() throws Exception { phrase = new Phrase(37, wordList); } @Test public void testCompare() { Phrase o = new Phrase(43, phrase), t = new Phrase(43, phrase); assertEquals(-1, phrase.compareTo(o)); assertEquals(1, t.compareTo(phrase)); assertEquals(0, o.compareTo(t)); assertEquals(0, phrase.compareTo(phrase)); } @Test public void testSize() { assertEquals(5, phrase.size()); } @Test public void testPhraseComparableOfIListOfString() { assertEquals(phrase, new Phrase(phrase.getNumber(), wordList)); String[] str = null; try { new Phrase(phrase.getNumber(), str); fail("able to create phrase with null word list"); } catch(IllegalArgumentException ex) { // expected } str = new String[]{"blah", null, "blah"}; try { new Phrase(phrase.getNumber(), str); fail("able to create phrase with null word in list"); } catch(IllegalArgumentException ex) { // expected } } @Test public void testGetNumber() { assertEquals(new Integer(37), phrase.getNumber()); } @Test public void testGetInt() { assertEquals("is", phrase.get(1)); assertEquals("a", phrase.get(2)); assertEquals(".", phrase.get(4)); try { phrase.get(phrase.size()); fail("able to access word in phrase after 
end"); } catch(IndexOutOfBoundsException expected) { // do nothing } } @Test public void testSetIntString() { try { phrase.set(2, "sdfskjdlkjflksjdlkj"); fail("able to set"); } catch(UnsupportedOperationException expected) { // noop } } @Test public void testAdd() { try { phrase.add("blah"); fail("able to add"); } catch(UnsupportedOperationException expected) { // noop } } public void testRemove() { try { phrase.remove("is"); fail("able to remove"); } catch(UnsupportedOperationException expected) { // noop } } public void testIteratorRemove() { try { Iterator i = phrase.iterator(); i.next(); i.remove(); fail("able to remove via iterator"); } catch(UnsupportedOperationException expected) { // noop } } @Test public void testEqualsObject() { List l = new ArrayList(); for(int i = 0; i < 3; i++) { l.add("blah"); } Phrase same = new Phrase(phrase.getNumber(), phrase), diff = new Phrase(17, l); assertEquals(phrase, same); assertNotSame(phrase, diff); if(!phrase.equals(same)) { fail("not equal"); } if(phrase.equals(diff)) { fail("equal"); } } } ================================================ FILE: test/opennlp/ccg/disjunctivizer/AlignedEdgeFilterTest.java ================================================ package opennlp.ccg.disjunctivizer; import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertFalse; import static org.junit.Assert.assertTrue; import static org.junit.Assert.fail; import java.util.Collections; import java.util.HashSet; import java.util.Set; import opennlp.ccg.disjunctivizer.AlignedEdgeFilter; import opennlp.ccg.disjunctivizer.MatchType; import opennlp.ccg.hylo.ModeLabel; import opennlp.ccg.hylo.NominalAtom; import opennlp.ccg.hylo.Proposition; import opennlp.ccg.hylo.graph.LFEdge; import opennlp.ccg.hylo.graph.LFEdgeLabel; import opennlp.ccg.hylo.graph.LFBaseTest; import opennlp.ccg.hylo.graph.LFVertex; import org.junit.Before; import org.junit.Test; public class AlignedEdgeFilterTest extends LFBaseTest { AlignedEdgeFilter filter; Set indices; @Before public void setUp() throws Exception { super.setUp(); indices = new HashSet(); indices.add(0); indices.add(2); indices.add(3); filter = new AlignedEdgeFilter(indices, MatchType.SOURCE_ALIGNED, MatchType.TARGET_UNALIGNED); } @Test public void testAlignedEdgeFilter() { try { new AlignedEdgeFilter(null, MatchType.SOURCE_ALIGNED); fail("able to specify null alignment indices"); } catch(IllegalArgumentException expected) { // do nothing } } @Test public void testGetAlignmentIndices() { assertEquals(indices, filter.getAlignmentIndices()); } @SuppressWarnings("unchecked") @Test public void testSetAlignmentIndices() { filter.setAlignmentIndices(Collections.EMPTY_SET); assertTrue(filter.getAlignmentIndices().isEmpty()); try { filter.setAlignmentIndices(null); fail("able to specify null alignment indices"); } catch(IllegalArgumentException expected) { // do nothing } } @SuppressWarnings("unchecked") @Test public void testAllows() { LFEdge one = new LFEdge(new LFVertex(new NominalAtom("w0"), new Proposition("blah")), new LFVertex(new NominalAtom("w1"), new Proposition("blah blah")), new LFEdgeLabel(new ModeLabel("blase"))), two = new LFEdge(new LFVertex(new NominalAtom("w2"), new Proposition("blah")), new LFVertex(new NominalAtom("w3"), new Proposition("blah blah")), new LFEdgeLabel(new ModeLabel("blase"))); assertTrue(filter.allows(one)); assertFalse(filter.allows(two)); filter.setAlignmentIndices(Collections.EMPTY_SET); assertFalse(filter.allows(one)); assertFalse(filter.allows(two)); // make self-contradictory filter 
filter = new AlignedEdgeFilter(indices, MatchType.SOURCE_ALIGNED, MatchType.SOURCE_UNALIGNED); assertFalse(filter.allows(one)); assertFalse(filter.allows(two)); } } ================================================ FILE: test/opennlp/ccg/disjunctivizer/DisjunctivizerTest.java ================================================ package opennlp.ccg.disjunctivizer; import static org.junit.Assert.*; import java.io.BufferedWriter; import java.io.File; import java.io.FileWriter; import java.util.LinkedHashSet; import java.util.Properties; import java.util.Set; import javax.xml.parsers.DocumentBuilder; import javax.xml.parsers.DocumentBuilderFactory; import javax.xml.parsers.ParserConfigurationException; import opennlp.ccg.alignment.Alignment; import opennlp.ccg.alignment.Alignments; import opennlp.ccg.alignment.Mapping; import opennlp.ccg.alignment.Phrase; import opennlp.ccg.alignment.PhrasePosition; import opennlp.ccg.alignment.Status; import opennlp.ccg.hylo.graph.LFGraphFactory; import opennlp.ccg.hylo.graph.LFBaseTest; import org.apache.xml.serializer.OutputPropertiesFactory; import org.apache.xml.serializer.Serializer; import org.apache.xml.serializer.SerializerFactory; import org.jdom.input.DOMBuilder; import org.junit.Before; import org.junit.Test; import org.w3c.dom.Document; import org.w3c.dom.Element; import org.w3c.dom.NodeList; public class DisjunctivizerTest extends LFBaseTest { static Properties OUTPUT_PROPERTIES = OutputPropertiesFactory.getDefaultMethodProperties("xml"); static { OUTPUT_PROPERTIES.setProperty("indent", "yes"); OUTPUT_PROPERTIES.setProperty("media-type", "text/xml"); OUTPUT_PROPERTIES.setProperty(OutputPropertiesFactory.S_KEY_INDENT_AMOUNT, "2"); OUTPUT_PROPERTIES.setProperty("{http\u003a//xml.apache.org/xalan}indent-amount", "2"); } DocumentBuilder documentBuilder; DOMBuilder domBuilder; File alignmentsFile, paraphrasesFile, outputFile; @Before public void setUp() throws Exception { super.setUp(); try { documentBuilder = DocumentBuilderFactory.newInstance().newDocumentBuilder(); } catch(ParserConfigurationException e) { throw new Exception("problem with parser configuration: " + e.getLocalizedMessage(), e); } domBuilder = new DOMBuilder(); File testDir = new File(System.getProperty("user.dir"), "test"); paraphrasesFile = new File(testDir, "paraphrases.xml"); outputFile = new File(testDir, "output.xml"); } @Test public void testDisjunctivizer() { try { new Disjunctivizer(null); fail("able to create disjunctivizer with null document"); } catch(IllegalArgumentException expected) { // do nothing } } @Test public void testBuildDisjunctiveLF() throws Exception { Document paraphrases = documentBuilder.parse(paraphrasesFile); Serializer s = SerializerFactory.getSerializer(OUTPUT_PROPERTIES); s.setOutputFormat(OUTPUT_PROPERTIES); s.setWriter(new BufferedWriter(new FileWriter(outputFile))); Disjunctivizer disj = null; NodeList paras = paraphrases.getElementsByTagName("paraphrase"); Document out = documentBuilder.newDocument(); Element dlfsElement = out.createElement("dlfs"); out.appendChild(dlfsElement); for(int i = 0; i < paras.getLength(); i++) { Element para = (Element)paras.item(i); Integer id = Integer.parseInt(para.getAttribute("id")); Element first = (Element)para.getElementsByTagName("first").item(0), second = (Element)para.getElementsByTagName("second").item(0); Set ms = new LinkedHashSet(); NodeList als = para.getElementsByTagName("alignments"); for(int j = 0; j < als.getLength(); j++) { Element al = (Element)als.item(j); 
if(al.getAttribute("source").equals("ANNOTATOR")) { NodeList as = al.getElementsByTagName("alignment"); for(int k = 0; k < as.getLength(); k++) { Element a = (Element)as.item(k); ms.add(new Mapping(id, Integer.parseInt(a.getAttribute("first")), Integer.parseInt(a.getAttribute("second")), Status.forAbbreviation(a.getAttribute("status")))); } } } Alignment a = new Alignment(new Phrase(id, Alignments.tokenize(first.getElementsByTagName("string").item(0).getTextContent())), new Phrase(id, Alignments.tokenize(second.getElementsByTagName("string").item(0).getTextContent())), ms); Element firstLF = (Element)first.getElementsByTagName("lf").item(0), secondLF = (Element)second.getElementsByTagName("lf").item(0); LFGraphDifference diff = (firstLF != null && secondLF != null) ? new LFGraphDifference(LFGraphFactory.newGraphFrom(firstLF), LFGraphFactory.newGraphFrom(secondLF), a) : null; for(PhrasePosition pos : PhrasePosition.values()) { Element str = out.createElement("string"); str.setAttribute("number", Integer.toString(id)); str.setAttribute("position", pos.name()); str.setTextContent(Alignments.untokenize(a.get(pos))); dlfsElement.appendChild(str); } Element msEl = out.createElement("mappings"); msEl.appendChild(out.createCDATASection(ms.toString())); dlfsElement.appendChild(msEl); if(diff == null) { dlfsElement.appendChild(out.createComment("missing LF!")); } else { if(disj == null) { disj = new Disjunctivizer(out); } Element dlf = disj.buildDisjunctiveLFFor(diff); dlfsElement.appendChild(dlf); assertEquals(dlf, disj.buildDisjunctiveLFFor(diff)); dlfsElement.appendChild(disj.buildDisjunctiveLFFor(diff.reverse())); assertNotSame(dlf, disj.buildDisjunctiveLFFor(diff.reverse())); } } s.asDOMSerializer().serialize(out); } } ================================================ FILE: test/opennlp/ccg/disjunctivizer/EdgeMatchFilterTest.java ================================================ package opennlp.ccg.disjunctivizer; import static org.junit.Assert.assertFalse; import static org.junit.Assert.assertTrue; import static org.junit.Assert.fail; import opennlp.ccg.disjunctivizer.EdgeMatchFilter; import opennlp.ccg.disjunctivizer.MatchType; import opennlp.ccg.hylo.ModeLabel; import opennlp.ccg.hylo.NominalAtom; import opennlp.ccg.hylo.Proposition; import opennlp.ccg.hylo.graph.LFEdge; import opennlp.ccg.hylo.graph.LFEdgeLabel; import opennlp.ccg.hylo.graph.LFBaseTest; import opennlp.ccg.hylo.graph.LFVertex; import org.junit.Before; import org.junit.Test; public class EdgeMatchFilterTest extends LFBaseTest { EdgeMatchFilter filter; LFEdge edge; @Before public void setUp() throws Exception { super.setUp(); edge = new LFEdge(new LFVertex(new NominalAtom("w0"), new Proposition("blah")), new LFVertex(new NominalAtom("w1"), new Proposition("blah blah")), new LFEdgeLabel(new ModeLabel("blase"))); filter = new EdgeMatchFilter(edge, MatchType.LABEL_MISMATCH, MatchType.SOURCE_PREDICATE_MISMATCH, MatchType.TARGET_PREDICATE_MATCH); } @Test public void testEdgeMatchFilter() { try { new EdgeMatchFilter(null, MatchType.LABEL_MATCH); fail("able to specify null edge"); } catch(IllegalArgumentException expected) { // do nothing } } @Test public void testAllows() { LFEdge test = new LFEdge(new LFVertex(new NominalAtom("w0"), new Proposition("blah blah")), new LFVertex(new NominalAtom("w1"), new Proposition("blah blah")), new LFEdgeLabel(new ModeLabel("boring"))); assertTrue(filter.allows(test)); test = new LFEdge(test.getSource(), test.getTarget(), edge.getLabel()); assertFalse(filter.allows(test)); } } 
================================================ FILE: test/opennlp/ccg/disjunctivizer/FilteredLFEdgeSetTest.java ================================================ package opennlp.ccg.disjunctivizer; import static org.junit.Assert.*; import java.util.HashSet; import java.util.LinkedHashSet; import java.util.Set; import opennlp.ccg.disjunctivizer.AlignedEdgeFilter; import opennlp.ccg.disjunctivizer.EdgeMatchFilter; import opennlp.ccg.disjunctivizer.FilteredLFEdgeSet; import opennlp.ccg.disjunctivizer.MatchType; import opennlp.ccg.hylo.ModeLabel; import opennlp.ccg.hylo.NominalAtom; import opennlp.ccg.hylo.Proposition; import opennlp.ccg.hylo.graph.LFEdge; import opennlp.ccg.hylo.graph.LFEdgeLabel; import opennlp.ccg.hylo.graph.LFBaseTest; import opennlp.ccg.hylo.graph.LFVertex; import opennlp.ccg.util.CompositeFilter; import opennlp.ccg.util.Filter; import org.junit.Before; import org.junit.Test; public class FilteredLFEdgeSetTest extends LFBaseTest { FilteredLFEdgeSet set; Set edges; Filter edgeFilter; LFEdge one, two, three; @SuppressWarnings("unchecked") @Before public void setUp() throws Exception { super.setUp(); one = new LFEdge(new LFVertex(new NominalAtom("w0"), new Proposition("blah")), new LFVertex(new NominalAtom("w1"), new Proposition("blah blah")), new LFEdgeLabel(new ModeLabel("blase"))); two = new LFEdge(new LFVertex(new NominalAtom("w2"), new Proposition("blah")), new LFVertex(new NominalAtom("w3"), new Proposition("blah blah")), new LFEdgeLabel(new ModeLabel("bored"))); three = new LFEdge(new LFVertex(new NominalAtom("w0"), new Proposition("zzz")), new LFVertex(new NominalAtom("w2"), new Proposition("snooze")), new LFEdgeLabel(new ModeLabel("blase"))); edges = new LinkedHashSet(); edges.add(one); edges.add(two); edges.add(three); Set indices = new HashSet(); indices.add(0); indices.add(2); indices.add(3); edgeFilter = new CompositeFilter(new EdgeMatchFilter(one, MatchType.SOURCE_PREDICATE_MATCH, MatchType.LABEL_MISMATCH), new AlignedEdgeFilter(indices, MatchType.TARGET_ALIGNED, MatchType.SOURCE_ALIGNED)); set = new FilteredLFEdgeSet(edges, edgeFilter); } @Test public void testSourceView() { assertTrue(set.sourceView().contains(two.getSource())); assertEquals(1, set.sourceView().size()); } @Test public void testTargetView() { assertTrue(set.targetView().contains(two.getTarget())); assertEquals(1, set.targetView().size()); } @Test public void testLabelView() { assertTrue(set.labelView().contains(two.getLabel())); assertEquals(1, set.labelView().size()); } } ================================================ FILE: test/opennlp/ccg/disjunctivizer/LFGraphDifferenceTest.java ================================================ package opennlp.ccg.disjunctivizer; import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertFalse; import static org.junit.Assert.assertTrue; import static org.junit.Assert.fail; import java.util.Collections; import java.util.Iterator; import java.util.Map; import java.util.Set; import opennlp.ccg.alignment.Alignment; import opennlp.ccg.alignment.Mapping; import opennlp.ccg.alignment.Phrase; import opennlp.ccg.alignment.PhrasePosition; import opennlp.ccg.hylo.ModeLabel; import opennlp.ccg.hylo.NominalAtom; import opennlp.ccg.hylo.Proposition; import opennlp.ccg.hylo.graph.LFEdge; import opennlp.ccg.hylo.graph.LFEdgeLabel; import opennlp.ccg.hylo.graph.LFGraph; import opennlp.ccg.hylo.graph.LFBaseTest; import opennlp.ccg.hylo.graph.LFVertex; import org.junit.Before; import org.junit.Test; public class LFGraphDifferenceTest extends 
LFBaseTest { LFGraph aGraph, bGraph; Alignment alignment; LFGraphDifference diff; LFEdge aDet, aArg0, aMod, bArg0; @SuppressWarnings("unchecked") @Before public void setUp() throws Exception { super.setUp(); alignment = new Alignment(new Phrase(337, "A", "boy", "walks", "quickly"), new Phrase(337, "He", "moves"), Collections.EMPTY_SET); alignment.add(new Mapping(0, 0)); alignment.add(new Mapping(1, 0)); alignment.add(new Mapping(2, 1)); aGraph = new LFGraph(); LFVertex aw0 = new LFVertex(new NominalAtom("w0"), new Proposition("a")), aw1 = new LFVertex(new NominalAtom("w1"), new Proposition("boy")), aw2 = new LFVertex(new NominalAtom("w2"), new Proposition("walk")), aw3 = new LFVertex(new NominalAtom("w3"), new Proposition("quickly")); aGraph.addVertex(aw0); aGraph.addVertex(aw1); aGraph.addVertex(aw2); aGraph.addVertex(aw3); aDet = aGraph.addLabeledEdge(aw1, aw0, LFEdgeLabel.forMode(new ModeLabel("Det"))); aArg0 = aGraph.addLabeledEdge(aw2, aw1, LFEdgeLabel.forMode(new ModeLabel("Arg0"))); aMod = aGraph.addLabeledEdge(aw2, aw3, LFEdgeLabel.forMode(new ModeLabel("Mod"))); bGraph = new LFGraph(); LFVertex bw0 = new LFVertex(new NominalAtom("w0"), new Proposition("he")), bw1 = new LFVertex(new NominalAtom("w1"), new Proposition("move")); bGraph.addVertex(bw0); bGraph.addVertex(bw1); bArg0 = bGraph.addLabeledEdge(bw1, bw0, LFEdgeLabel.forMode(new ModeLabel("Arg0"))); diff = new LFGraphDifference(aGraph, bGraph, alignment); } @Test public void testLFGraphDifference() { try { new LFGraphDifference(null, bGraph, alignment); fail("able to create LF graph difference with null graph"); } catch(IllegalArgumentException expected) { // do nothing } try { new LFGraphDifference(aGraph, null, alignment); fail("able to create LF graph difference with null graph"); } catch(IllegalArgumentException expected) { // do nothing } try { new LFGraphDifference(aGraph, bGraph, null); fail("able to create LF graph difference with null graph"); } catch(IllegalArgumentException expected) { // do nothing } } @Test public void testReverse() { LFGraphDifference ffid = diff.reverse(); assertEquals(diff.a.vertexSet(), ffid.b.vertexSet()); assertEquals(diff.a.edgeSet(), ffid.b.edgeSet()); for(PhrasePosition pos : PhrasePosition.values()) { assertEquals(diff.alignment.get(pos), ffid.alignment.get(pos.opposite())); } Map> m = ffid.alignment.asMap(); assertTrue(m.get(0).contains(0)); assertTrue(m.get(0).contains(1)); assertTrue(m.get(1).contains(2)); } @Test public void testDeletes() { Set dels = diff.deletes(); try { dels.add(bArg0); fail("able to add edge"); } catch(UnsupportedOperationException expected) { // noop } try { dels.remove(bArg0); fail("able to remove edge"); } catch(UnsupportedOperationException expected) { // noop } try { Iterator i = dels.iterator(); i.next(); i.remove(); fail("able to remove edge"); } catch(UnsupportedOperationException expected) { // noop } assertEquals(Collections.singleton(aMod), diff.deletes()); assertEquals(Collections.emptySet(), diff.reverse().deletes()); } @Test public void testInserts() { Set ins = diff.inserts(); try { ins.add(bArg0); fail("able to add edge"); } catch(UnsupportedOperationException expected) { // noop } try { ins.remove(bArg0); fail("able to remove edge"); } catch(UnsupportedOperationException expected) { // noop } assertEquals(Collections.emptySet(), diff.inserts()); assertEquals(Collections.singleton(aMod), diff.reverse().inserts()); } @Test public void testSubstitutions() { Set subs = diff.substitutions(); try { subs.add(bArg0); fail("able to add edge"); } 
catch(UnsupportedOperationException expected) { // noop } try { subs.remove(bArg0); fail("able to remove edge"); } catch(UnsupportedOperationException expected) { // noop } try { Iterator i = subs.iterator(); i.next(); i.remove(); fail("able to remove edge"); } catch(UnsupportedOperationException expected) { // noop } assertTrue(subs.contains(bArg0)); assertFalse(subs.contains(aArg0)); assertFalse(subs.contains(aDet)); assertFalse(subs.contains(aMod)); assertEquals(Collections.singleton(bArg0), diff.substitutionsFor(aArg0)); assertEquals(Collections.singleton(aArg0), diff.reverse().substitutionsFor(bArg0)); } @Test public void testSubstitutionsBySource() { Map> map = diff.substitutionsBySource(); assertTrue(map.keySet().contains(bArg0.getSource())); assertTrue(map.get(bArg0.getSource()).contains(bArg0)); assertEquals(1, map.size()); try { map.remove(bArg0.getSource()); fail("able to remove edge"); } catch(UnsupportedOperationException expected) { // noop } try { map.put(aArg0.getSource(), Collections.singleton(aArg0)); fail("able to put edge"); } catch(UnsupportedOperationException expected) { // noop } try { Iterator>> i = map.entrySet().iterator(); i.next(); i.remove(); fail("able to remove entry"); } catch(UnsupportedOperationException expected) { // noop } } @Test public void testSubstitutionsBySourceFor() { Map> map = diff.substitutionsBySourceFor(aArg0); assertTrue(map.keySet().contains(bArg0.getSource())); assertTrue(map.get(bArg0.getSource()).contains(bArg0)); assertEquals(1, map.size()); try { map.remove(bArg0.getSource()); fail("able to remove edge"); } catch(UnsupportedOperationException expected) { // noop } try { map.put(aArg0.getSource(), Collections.singleton(aArg0)); fail("able to put edge"); } catch(UnsupportedOperationException expected) { // noop } try { Iterator>> i = map.entrySet().iterator(); i.next(); i.remove(); fail("able to remove entry"); } catch(UnsupportedOperationException expected) { // noop } map = diff.substitutionsBySourceFor(aDet); assertTrue(map.isEmpty()); } } ================================================ FILE: test/opennlp/ccg/disjunctivizer/LabelMatchFilterTest.java ================================================ package opennlp.ccg.disjunctivizer; import static org.junit.Assert.*; import opennlp.ccg.disjunctivizer.LabelMatchFilter; import opennlp.ccg.hylo.ModeLabel; import opennlp.ccg.hylo.NominalAtom; import opennlp.ccg.hylo.Proposition; import opennlp.ccg.hylo.graph.LFEdge; import opennlp.ccg.hylo.graph.LFEdgeLabel; import opennlp.ccg.hylo.graph.LFBaseTest; import opennlp.ccg.hylo.graph.LFVertex; import org.junit.Before; import org.junit.Test; public class LabelMatchFilterTest extends LFBaseTest { LabelMatchFilter filter; LFEdgeLabel label; LFEdge one, two; @Before public void setUp() throws Exception { super.setUp(); one = new LFEdge(new LFVertex(new NominalAtom("w0"), new Proposition("blah")), new LFVertex(new NominalAtom("w1"), new Proposition("blah blah")), new LFEdgeLabel(new ModeLabel("blase"))); two = new LFEdge(new LFVertex(new NominalAtom("w2"), new Proposition("blah")), new LFVertex(new NominalAtom("w3"), new Proposition("blah blah")), new LFEdgeLabel(new ModeLabel("blurg"))); label = new LFEdgeLabel(new ModeLabel("blase")); filter = new LabelMatchFilter(label); } @Test public void testLabelMatchFilter() { try { new LabelMatchFilter(null); fail("able to specify null label"); } catch(IllegalArgumentException expected) { // do nothing } } @Test public void testSetBasis() { filter.setBasis(new LFEdgeLabel(new ModeLabel("boo"))); 
assertFalse(filter.allows(one)); assertFalse(filter.allows(two)); try { filter.setBasis(null); fail("able to specify null label"); } catch(IllegalArgumentException expected) { // do nothing } } @Test public void testAllows() { assertTrue(filter.allows(one)); assertFalse(filter.allows(two)); } } ================================================ FILE: test/opennlp/ccg/disjunctivizer/VertexMatchFilterTest.java ================================================ package opennlp.ccg.disjunctivizer; import static org.junit.Assert.*; import opennlp.ccg.disjunctivizer.MatchType; import opennlp.ccg.disjunctivizer.VertexMatchFilter; import opennlp.ccg.hylo.ModeLabel; import opennlp.ccg.hylo.NominalAtom; import opennlp.ccg.hylo.Proposition; import opennlp.ccg.hylo.graph.LFEdge; import opennlp.ccg.hylo.graph.LFEdgeLabel; import opennlp.ccg.hylo.graph.LFBaseTest; import opennlp.ccg.hylo.graph.LFVertex; import org.junit.Before; import org.junit.Test; public class VertexMatchFilterTest extends LFBaseTest { VertexMatchFilter filter; LFVertex one, two; LFEdge edge; @Before public void setUp() throws Exception { super.setUp(); one = new LFVertex(new NominalAtom("w0"), new Proposition("blah")); two = new LFVertex(new NominalAtom("w1"), new Proposition("blah")); edge = new LFEdge(two, new LFVertex(new NominalAtom("w2"), new Proposition("blah blah")), new LFEdgeLabel(new ModeLabel("blase"))); filter = new VertexMatchFilter(two, MatchType.SOURCE_MATCH); } @Test public void testVertexMatchFilter() { try { new VertexMatchFilter(null, MatchType.SOURCE_PREDICATE_MATCH); fail("able to specify null basis"); } catch(IllegalArgumentException expected) { // do nothing } } @Test public void testSetBasis() { filter.setBasis(one); assertFalse(filter.allows(edge)); edge = new LFEdge(one, edge.getTarget(), edge.getLabel()); assertTrue(filter.allows(edge)); try { filter.setBasis(null); fail("able to specify null basis"); } catch(IllegalArgumentException expected) { // do nothing } } @Test public void testAllows() { assertTrue(filter.allows(edge)); edge = new LFEdge(one, edge.getTarget(), edge.getLabel()); assertFalse(filter.allows(edge)); } } ================================================ FILE: test/opennlp/ccg/hylo/graph/LFBaseTest.java ================================================ package opennlp.ccg.hylo.graph; import java.io.File; import opennlp.ccg.grammar.Grammar; import org.junit.Before; import org.junit.Test; public class LFBaseTest { static Grammar grammar = null; @Before @SuppressWarnings("deprecation") public void setUp() throws Exception { if(grammar == null) { grammar = new Grammar(new File(new File( new File(System.getProperty("user.dir")), "test"), "grammar.xml").toURL()); } } @Test public void dummy() {} } ================================================ FILE: test/opennlp/ccg/hylo/graph/LFEdgeFactoryTest.java ================================================ package opennlp.ccg.hylo.graph; import static org.junit.Assert.*; import org.junit.Before; import org.junit.Test; public class LFEdgeFactoryTest extends LFEdgeTest { LFEdgeFactory factory; @Before public void setUp() throws Exception { super.setUp(); factory = new DefaultLFEdgeFactory(); } @Test public void testCreateEdge() { assertNotSame(edge, factory.createEdge(edge.source, edge.target)); edge = new LFEdge(edge.source, edge.target, null); assertEquals(edge, factory.createLabeledEdge(edge.source, edge.target, null)); } @Test public void testCreateLabeledEdge() { assertEquals(edge, factory.createLabeledEdge(edge.source, edge.target, edge.label)); } } 
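A second minimal, hypothetical sketch (again not a file in the repository; the class name LFGraphSketch is invented) shows how an LF graph is assembled by hand, mirroring the graphs built in LFGraphDifferenceTest above and LFGraphTest below, and using only the calls those tests make; as in LFBaseTest, a grammar is assumed to be loaded first.

import opennlp.ccg.hylo.ModeLabel;
import opennlp.ccg.hylo.NominalAtom;
import opennlp.ccg.hylo.Proposition;
import opennlp.ccg.hylo.graph.LFEdgeLabel;
import opennlp.ccg.hylo.graph.LFGraph;
import opennlp.ccg.hylo.graph.LFVertex;

public class LFGraphSketch { // hypothetical class, for illustration only

    public static void main(String[] args) {
        // Assumes a grammar has already been loaded, as LFBaseTest does in setUp().
        // Vertices carry a nominal, a proposition, and optional mode attributes.
        LFGraph graph = new LFGraph();
        LFVertex walk = new LFVertex(new NominalAtom("w2"), new Proposition("walk"));
        walk.setAttribute(new ModeLabel("tense"), new Proposition("past"));
        LFVertex boy = new LFVertex(new NominalAtom("w1"), new Proposition("boy"));
        LFVertex det = new LFVertex(new NominalAtom("w0"), new Proposition("a"));
        graph.addVertex(walk);
        graph.addVertex(boy);
        graph.addVertex(det);

        // Dependency edges are added with mode-derived labels,
        // as in LFGraphDifferenceTest.
        graph.addLabeledEdge(walk, boy, LFEdgeLabel.forMode(new ModeLabel("Arg0")));
        graph.addLabeledEdge(boy, det, LFEdgeLabel.forMode(new ModeLabel("Det")));

        // Vertices can be recovered from their nominals, as LFGraphTest checks.
        System.out.println(graph.findVertexByNominal(boy.nominal));
        System.out.println(graph.vertexSet().size() + " vertices, "
            + graph.edgeSet().size() + " edges");
    }
}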
================================================ FILE: test/opennlp/ccg/hylo/graph/LFEdgeTest.java ================================================ package opennlp.ccg.hylo.graph; import static org.junit.Assert.*; import opennlp.ccg.hylo.ModeLabel; import opennlp.ccg.hylo.NominalAtom; import opennlp.ccg.hylo.Proposition; import org.junit.Before; import org.junit.Test; public class LFEdgeTest extends LFBaseTest { LFVertex source, target; LFEdgeLabel label; LFEdge edge; @Before public void setUp() throws Exception { super.setUp(); source = new LFVertex(new NominalAtom("w3"), new Proposition("prop1")); target = new LFVertex(new NominalAtom("w9"), new Proposition("prop2")); label = new LFEdgeLabel(new ModeLabel("Arg0")); edge = new LFEdge(source, target, label); } @Test public void testLFEdge() { try { new LFEdge(null, target); fail("able to specify null target"); } catch(IllegalArgumentException expected) { // do nothing } try { new LFEdge(source, null); fail("able to specify null target"); } catch(IllegalArgumentException expected) { // do nothing } try { new LFEdge(source, target, null); } catch(IllegalArgumentException expected) { fail("unable to specify null label"); } } @Test public void testEqualsObject() { assertEquals(edge, new LFEdge(edge.source, edge.target, edge.label)); } } ================================================ FILE: test/opennlp/ccg/hylo/graph/LFGraphTest.java ================================================ package opennlp.ccg.hylo.graph; import static org.junit.Assert.*; import java.io.File; import java.util.HashSet; import javax.xml.parsers.DocumentBuilder; import javax.xml.parsers.DocumentBuilderFactory; import javax.xml.parsers.ParserConfigurationException; import opennlp.ccg.hylo.ModeLabel; import opennlp.ccg.hylo.NominalAtom; import opennlp.ccg.hylo.Proposition; import opennlp.ccg.realize.Realizer; import opennlp.ccg.synsem.LF; import org.jdom.input.DOMBuilder; import org.junit.Before; import org.junit.Test; public class LFGraphTest extends LFBaseTest { LF testLF; LFGraph graph, expected; @Before public void setUp() throws Exception { super.setUp(); DocumentBuilder db; try { db = DocumentBuilderFactory.newInstance().newDocumentBuilder(); } catch(ParserConfigurationException e) { throw new Exception("problem with parser configuration: " + e.getLocalizedMessage(), e); } File testFile = new File(new File(new File(System.getProperty("user.dir")), "test"), "testlf.xml"); testLF = Realizer.getLfFromElt(new DOMBuilder().build(db.parse(testFile).getDocumentElement())); graph = LFGraphFactory.newGraphFrom(testLF); expected = new LFGraph(LFGraphFactory.DEFAULT_EDGE_FACTORY); LFVertex w7 = new LFVertex(new NominalAtom("w7"), new Proposition("be")); w7.setAttribute(new ModeLabel("mood"), new Proposition("dcl")); w7.setAttribute(new ModeLabel("tense"), new Proposition("past")); expected.addVertex(w7); LFVertex w0 = new LFVertex(new NominalAtom("w0"), new Proposition("bank")); w0.setAttribute(new ModeLabel("det"), new Proposition("nil")); expected.addVertex(w0); LFVertex w1 = new LFVertex(new NominalAtom("w1"), new Proposition("of")); expected.addVertex(w1); LFVertex w2 = new LFVertex(new NominalAtom("w2"), new Proposition("holland")); w2.setAttribute(new ModeLabel("det"), new Proposition("nil")); w2.setAttribute(new ModeLabel("num"), new Proposition("sg")); expected.addVertex(w2); LFVertex w5 = new LFVertex(new NominalAtom("w5"), new Proposition("office")); w5.setAttribute(new ModeLabel("det"), new Proposition("nil")); w5.setAttribute(new ModeLabel("num"), new 
Proposition("sg")); expected.addVertex(w5); LFVertex w4 = new LFVertex(new NominalAtom("w4"), new Proposition("wuhan")); w4.setAttribute(new ModeLabel("num"), new Proposition("sg")); expected.addVertex(w4); LFVertex w9 = new LFVertex(new NominalAtom("w9"), new Proposition("officially")); expected.addVertex(w9); LFVertex w8 = new LFVertex(new NominalAtom("w8"), new Proposition("also")); expected.addVertex(w8); LFVertex w10 = new LFVertex(new NominalAtom("w10"), new Proposition("establish")); w10.setAttribute(new ModeLabel("tense"), new Proposition("past")); expected.addVertex(w10); LFVertex w11 = new LFVertex(new NominalAtom("w11"), new Proposition("just")); expected.addVertex(w11); LFVertex w12 = new LFVertex(new NominalAtom("w12"), new Proposition("recently")); expected.addVertex(w12); expected.addLabeledEdge(w7, w0, LFEdgeLabel.forMode(new ModeLabel("Arg0"))); expected.addLabeledEdge(w0, w1, LFEdgeLabel.forMode(new ModeLabel("Mod"))); expected.addLabeledEdge(w1, w2, LFEdgeLabel.forMode(new ModeLabel("Arg1"))); expected.addLabeledEdge(w2, w5, LFEdgeLabel.forMode(new ModeLabel("ApposRel"))); expected.addLabeledEdge(w5, w4, LFEdgeLabel.forMode(new ModeLabel("Mod"))); expected.addLabeledEdge(w7, w9, LFEdgeLabel.forMode(new ModeLabel("Arg1"))); expected.addLabeledEdge(w9, w0, LFEdgeLabel.forMode(new ModeLabel("Arg0"))); expected.addLabeledEdge(w7, w8, LFEdgeLabel.forMode(new ModeLabel("Mod"))); expected.addLabeledEdge(w7, w10, LFEdgeLabel.forMode(new ModeLabel("GenRel"))); expected.addLabeledEdge(w10, w0, LFEdgeLabel.forMode(new ModeLabel("Arg1"))); expected.addLabeledEdge(w10, w11, LFEdgeLabel.forMode(new ModeLabel("Mod"))); expected.addLabeledEdge(w10, w12, LFEdgeLabel.forMode(new ModeLabel("Mod"))); } @Test public void testLFGraph() { assertEquals(expected.vertexSet(), graph.vertexSet()); assertEquals(expected.edgeSet(), graph.edgeSet()); } @Test public void testRemoveVertex() { for(LFVertex v : new HashSet(graph.vertexSet())) { graph.removeVertex(v); assertNull(graph.findVertexByNominal(v.nominal)); } } @Test public void testFindVertexByNominal() { for(LFVertex vertex : expected.vertexSet()) { assertEquals(vertex, graph.findVertexByNominal(vertex.nominal)); } } } ================================================ FILE: test/opennlp/ccg/hylo/graph/LFVertexTest.java ================================================ package opennlp.ccg.hylo.graph; import static org.junit.Assert.*; import java.util.Collections; import java.util.HashMap; import java.util.Iterator; import java.util.Map; import opennlp.ccg.hylo.Mode; import opennlp.ccg.hylo.ModeLabel; import opennlp.ccg.hylo.Nominal; import opennlp.ccg.hylo.NominalAtom; import opennlp.ccg.hylo.Proposition; import org.junit.Before; import org.junit.Test; public class LFVertexTest extends LFBaseTest { Nominal wordNominal, nonwordNominal; Proposition proposition; Integer wordIndex, nonwordIndex; LFVertex word, nonword; Map attrs; @Before public void setUp() throws Exception { super.setUp(); wordNominal = new NominalAtom("w7"); nonwordNominal = new NominalAtom("x1"); proposition = new Proposition("prop"); wordIndex = Integer.valueOf(7); nonwordIndex = Integer.valueOf(1); attrs = new HashMap(); attrs.put(new ModeLabel("num"), new Proposition("sg")); attrs.put(new ModeLabel("det"), new Proposition("nil")); attrs.put(new ModeLabel("tense"), new Proposition("past")); word = new LFVertex(wordNominal, proposition, attrs); nonword = new LFVertex(nonwordNominal, proposition); } @Test public void testLFVertex() { try { new LFVertex((Nominal)null); fail("able to 
specify null nominal"); } catch(IllegalArgumentException expected) { // do nothing } try { new LFVertex(wordNominal, null); } catch(IllegalArgumentException expected) { fail("unable to specify null proposition"); } } @Test public void testGetType() { assertEquals(LFVertexType.WORD, word.getType()); assertEquals(LFVertexType.NONWORD, nonword.getType()); assertNotSame(LFVertexType.WORD, nonword.getType()); assertNotSame(LFVertexType.NONWORD, word.getType()); } @Test public void testGetIndex() { assertEquals(wordIndex, word.getIndex()); assertEquals(nonwordIndex, nonword.getIndex()); } @Test public void testAttributeNames() { assertEquals(attrs.keySet(), word.attributeNames()); assertEquals(Collections.emptySet(), nonword.attributeNames()); try { Iterator i = word.attributeNames().iterator(); i.next(); i.remove(); fail("able to remove attribute name"); } catch(UnsupportedOperationException expected) { // do nothing } } @Test public void testContainsAttribute() { Mode num = new ModeLabel("num"); assertTrue(word.containsAttribute(num)); word.removeAttribute(num); assertFalse(word.containsAttribute(num)); } @Test public void testGetAttribute() { for(Mode m : attrs.keySet()) { assertEquals(attrs.get(m), word.getAttributeValue(m)); assertNull(nonword.getAttributeValue(m)); } } @Test public void testAddAttribute() { Mode num = new ModeLabel("num"); Proposition prop = new Proposition("pl"); assertFalse(word.addAttribute(num, new Proposition("sg"))); assertTrue(word.addAttribute(num, prop)); assertFalse(word.addAttribute(num, prop)); assertTrue(word.containsAttribute(num)); assertTrue(nonword.addAttribute(num, new Proposition("sg"))); assertFalse(nonword.addAttribute(num, new Proposition("sg"))); assertTrue(nonword.containsAttribute(num)); assertTrue(nonword.addAttribute(num, prop)); assertFalse(nonword.addAttribute(num, prop)); assertTrue(nonword.containsAttribute(num)); } @Test public void testSetAttribute() { Mode num = new ModeLabel("num"); Proposition prop = new Proposition("pl"); assertEquals(attrs.get(num), word.setAttribute(num, prop)); assertEquals(prop, word.getAttributeValue(num)); assertNull(nonword.setAttribute(num, prop)); assertEquals(prop, nonword.getAttributeValue(num)); } @Test public void testRemoveAttribute() { Mode num = new ModeLabel("num"); assertEquals(attrs.get(num), word.removeAttribute(num)); assertNull(nonword.removeAttribute(num)); } @Test public void testEqualsObject() { LFVertex v = new LFVertex(wordNominal, proposition); for(Mode m : attrs.keySet()) { v.setAttribute(m, attrs.get(m)); } assertEquals(v, word); assertNotSame(v, nonword); } @Test public void testGetAttributeMap() { Map m = word.getAttributeMap(); assertEquals(attrs, m); try { Iterator> i = m.entrySet().iterator(); i.next(); i.remove(); fail("able to remove from attribute map"); } catch(UnsupportedOperationException expected) { // do nothing } try { m.put(new ModeLabel("foo"), new Proposition("bar")); fail("able to put into attribute map"); } catch(UnsupportedOperationException expected) { // do nothing } } } ================================================ FILE: test/opennlp/ccg/util/CompositeFilterTest.java ================================================ package opennlp.ccg.util; import static org.junit.Assert.*; import java.util.HashSet; import java.util.Set; import org.junit.Before; import org.junit.Test; public class CompositeFilterTest { VisitedFilter visited; Integer target = 37; Filter lessThanFilter, greaterThanFilter; CompositeFilter bothFilter, equalToFilter; @SuppressWarnings("unchecked") 
@Before public void setUp() throws Exception { visited = new VisitedFilter(); lessThanFilter = new Filter() { @Override public boolean allows(Integer e) { return e < target; } }; greaterThanFilter = new Filter() { @Override public boolean allows(Integer e) { return e > target; } }; Set> s = new HashSet>(); s.add(lessThanFilter); s.add(greaterThanFilter); bothFilter = new CompositeFilter(s); equalToFilter = new CompositeFilter(new InverseFilter(bothFilter)); } @Test public void testContainsFilter() { assertTrue(bothFilter.containsFilter(lessThanFilter)); assertTrue(bothFilter.containsFilter(greaterThanFilter)); assertFalse(bothFilter.containsFilter(bothFilter)); } @Test public void testAddFilter() { Filter f = new VisitedFilter(); equalToFilter.addFilter(f); assertTrue(equalToFilter.allows(37)); assertFalse(equalToFilter.allows(37)); try { equalToFilter.addFilter(null); fail("able to add null filter"); } catch(IllegalArgumentException expected) { // do nothing } } @Test public void testRemoveFilter() { Filter f = new VisitedFilter(); equalToFilter.addFilter(f); assertTrue(equalToFilter.allows(37)); equalToFilter.removeFilter(f); assertTrue(equalToFilter.allows(37)); assertTrue(equalToFilter.allows(37)); } @Test public void testAllows() { assertTrue(lessThanFilter.allows(17)); assertFalse(lessThanFilter.allows(38)); assertFalse(greaterThanFilter.allows(17)); assertTrue(greaterThanFilter.allows(38)); assertFalse(bothFilter.allows(37)); assertTrue(equalToFilter.allows(37)); } } ================================================ FILE: test/opennlp/ccg/util/DelegatedFilterTest.java ================================================ package opennlp.ccg.util; import static org.junit.Assert.*; import org.junit.Before; import org.junit.Test; public class DelegatedFilterTest { Filter lengthFilter; DelegatedFilter stringFilter; @Before public void setUp() throws Exception { lengthFilter = new Filter() { @Override public boolean allows(Integer i) { return i <= 5; } }; stringFilter = new DelegatedFilter(lengthFilter) { @Override public Integer delegateValueFor(String e) { return e.length(); } }; } @Test public void testAllows() { assertTrue(stringFilter.allows("Scott")); assertTrue(stringFilter.allows("Mike")); assertTrue(stringFilter.allows("Jason")); assertFalse(stringFilter.allows("Dominic")); assertFalse(stringFilter.allows("Dennis")); } @Test public void testDelegateValueFor() { assertEquals(Integer.valueOf(5), stringFilter.delegateValueFor("Scott")); } } ================================================ FILE: test/opennlp/ccg/util/FilteredMapTest.java ================================================ package opennlp.ccg.util; import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertFalse; import static org.junit.Assert.assertNull; import static org.junit.Assert.assertTrue; import static org.junit.Assert.fail; import java.util.HashMap; import java.util.Map; import java.util.Map.Entry; import org.junit.Before; import org.junit.Test; public class FilteredMapTest { Map map; FilteredMap filteredMap; Filter keyFilter; Integer target = 37; @Before public void setUp() throws Exception { map = new HashMap(); map.put(17, "seventeen"); map.put(31, "thirty-one"); map.put(37, "thirty-seven"); map.put(43, "forty-three"); keyFilter = new Filter() { @Override public boolean allows(Integer e) { return target >= e; } }; filteredMap = new FilteredMap(map, keyFilter); } @Test public void testFilteredMap() { try { new FilteredMap(map, null); fail("able to specify null key filter"); } 
catch(IllegalArgumentException expected) { // do nothing } } @Test public void testGetOriginalMap() { assertEquals(map, filteredMap.getOriginalMap()); } @Test public void testGetKeyFilter() { assertEquals(keyFilter, filteredMap.getKeyFilter()); } @Test public void testEntrySet() { for(Entry e : filteredMap.entrySet()) { if(e.getKey() > target) { fail("filtered map contains bad key"); } } } @Test public void testPut() { assertNull(filteredMap.put(47, "blah")); assertNull(filteredMap.put(29, "twenty-nine")); assertFalse(filteredMap.containsKey(47)); assertTrue(filteredMap.containsKey(29)); assertEquals("twenty-nine", filteredMap.put(29, "blah")); assertEquals("blah", filteredMap.get(29)); } @Test public void testContainsValue() { assertTrue(filteredMap.containsValue("seventeen")); assertFalse(filteredMap.containsValue("forty-three")); } @Test public void testContainsKey() { assertTrue(filteredMap.containsKey(31)); assertFalse(filteredMap.containsKey(43)); } @Test public void testKeySet() { for(Integer k : filteredMap.keySet()) { if(k.equals(43)) { fail("filtered map contains bad key"); } } } @Test public void testValues() { assertTrue(filteredMap.values().contains("seventeen")); assertFalse(filteredMap.values().contains("forty-three")); filteredMap.remove(17); assertFalse(filteredMap.values().contains("seventeen")); } } ================================================ FILE: test/opennlp/ccg/util/FilteredSetTest.java ================================================ package opennlp.ccg.util; import static org.junit.Assert.*; import java.util.ArrayList; import java.util.Arrays; import java.util.Iterator; import java.util.List; import org.junit.Before; import org.junit.Test; public class FilteredSetTest { FilteredSet testSet, sameSet; List values; Filter testFilter, sameFilter; @Before public void setUp() throws Exception { values = new ArrayList(Arrays.asList("test", "test", "other", "different")); testFilter = new Filter() { @Override public boolean allows(String e) { return e.equals("test"); } }; sameFilter = new VisitedFilter(); testSet = new FilteredSet(values, testFilter); sameSet = new FilteredSet(values, sameFilter); } @Test public void testFilteredSet() { try { new FilteredSet(testSet, null); fail("able to specify null filter"); } catch(IllegalArgumentException expected) { // do nothing } } @Test public void testSize() { assertEquals(1, testSet.size()); assertEquals(values.size() - 1, sameSet.size()); } @Test public void testAdd() { int sz = testSet.size(); assertFalse(testSet.add("test")); assertTrue(testSet.remove("test")); assertEquals(sz - 1, testSet.size()); assertFalse(sameSet.add("test")); assertTrue(sameSet.add("blah")); assertTrue(sameSet.add("xyxyx")); assertFalse(sameSet.add("xyxyx")); assertEquals(5, sameSet.size()); } @Test public void testIterator() { Iterator i = testSet.iterator(); assertTrue(i.hasNext()); assertEquals("test", i.next()); assertFalse(i.hasNext()); i = sameSet.iterator(); assertTrue(i.hasNext()); assertEquals("test", i.next()); assertEquals("other", i.next()); assertEquals("different", i.next()); i = sameSet.iterator(); assertEquals("test", i.next()); i.remove(); assertFalse(sameSet.contains("test")); } @Test public void testRemove() { testSet.remove("test"); assertFalse(testSet.contains("test")); sameSet.remove("test"); assertFalse(sameSet.contains("test")); } @Test public void testClear() { testSet.clear(); assertEquals(0, testSet.size()); sameSet.clear(); assertEquals(0, sameSet.size()); } @Test public void testGetOriginalCollection() { 
assertEquals(values, testSet.getOriginalCollection()); assertEquals(values, sameSet.getOriginalCollection()); } } ================================================ FILE: test/opennlp/ccg/util/InverseFilterTest.java ================================================ package opennlp.ccg.util; import static org.junit.Assert.*; import org.junit.Before; import org.junit.Test; public class InverseFilterTest { VisitedFilter visited; InverseFilter inverse; @Before public void setUp() throws Exception { visited = new VisitedFilter(); inverse = new InverseFilter(visited); } @Test public void testInverseFilter() { try { new InverseFilter(null); fail("able to specify null filter"); } catch(IllegalArgumentException expected) { // do nothing } } @Test public void testGetOriginalFilter() { assertEquals(visited, inverse.getOriginalFilter()); } @Test public void testAllows() { assertTrue(visited.allows(37)); assertFalse(visited.allows(37)); assertTrue(inverse.allows(37)); assertFalse(inverse.allows(17)); assertFalse(visited.allows(17)); assertTrue(inverse.allows(17)); } } ================================================ FILE: test/opennlp/ccg/util/MembershipFilterTest.java ================================================ package opennlp.ccg.util; import static org.junit.Assert.*; import java.util.HashSet; import java.util.Set; import org.junit.Before; import org.junit.Test; public class MembershipFilterTest { Filter filter; Set strings; @Before public void setUp() throws Exception { strings = new HashSet(); strings.add("test"); strings.add("one"); strings.add("two"); strings.add("three"); filter = new MembershipFilter(strings); } @Test public void testMembershipFilter() { try { new MembershipFilter(null); fail("able to specify null members"); } catch(IllegalArgumentException expected) { // do nothing } } @Test public void testAllows() { for(String s : strings) { assertTrue(filter.allows(s)); } assertFalse(filter.allows("blah")); assertFalse(filter.allows("")); assertFalse(filter.allows(null)); } } ================================================ FILE: test/opennlp/ccg/util/VisitedFilterTest.java ================================================ package opennlp.ccg.util; import static org.junit.Assert.*; import org.junit.Before; import org.junit.Test; public class VisitedFilterTest { VisitedFilter filter; @Before public void setUp() throws Exception { filter = new VisitedFilter(); } @Test public void testAllows() { assertTrue(filter.allows(1)); assertFalse(filter.allows(1)); assertTrue(filter.allows(0)); } @Test public void testHasVisited() { assertTrue(filter.allows(1)); assertTrue(filter.hasVisited(1)); assertFalse(filter.hasVisited(13)); } } ================================================ FILE: test/output.xml ================================================ chinese officials have repeatedly indicated that taiwan is a province of china and that china is a domestic chinese issue . the chinese government has always been signifying that taiwan is a province of china and taiwan issue is the internal issue of china . 
1, 1 <-> 2, 2 <-> 3, 2 <-> 5, 2 <-> 6, 3 <-> 4, 4 <-> 3, 4 <-> 5, 4 <-> 6, 5 <-> 7, 6 <-> 8, 6 <-> 15, 7 <-> 9, 8 <-> 10, 9 <-> 11, 10 <-> 12, 11 <-> 13, 12 <-> 14, 15 <-> 17, 16 <-> 18, 17 <-> 19, 18 <-> 21, 18 <-> 22, 19 <-> 20, 20 <-> 23]]]> the government of qinghai province made the best use of the situation , coming up with an idea to commercialize the urban infrastructure construction , and ratified , at the beginning of this year , provisions for xining city to encourage and guide foreign investments . the government of qinghai province put forward the idea of commercialization of city infrastructure , and approved some regulations on encouraging and attracting foreign investment in xining city early this year . 0, 1 <-> 1, 2 <-> 2, 3 <-> 3, 4 <-> 4, 13 <-> 5, 13 <-> 6, 14 <-> 5, 14 <-> 6, 15 <-> 5, 15 <-> 6, 16 <-> 7, 17 <-> 8, 18 <-> 9, 18 <-> 10, 19 <-> 9, 19 <-> 10, 21 <-> 12, 22 <-> 13, 24 <-> 14, 25 <-> 15, 26 <-> 16, 28 <-> 28, 29 <-> 28, 30 <-> 28, 32 <-> 29, 33 <-> 30, 35 <-> 18, 36 <-> 19, 36 <-> 25, 37 <-> 26, 38 <-> 27, 39 <-> 19, 40 <-> 20, 41 <-> 21, 42 <-> 22, 43 <-> 23, 44 <-> 24, 45 <-> 31]]]> relevant sections of the henan government released their foreign cooperation projects concerning economy and technology . representatives attending the meeting consulted on information of some projects they interested in. the competent agencies of the henan provincial government released [ a list of ] foreign economic technological cooperation projects of the province at the meeting and held discussions regarding the purpose of cooperation in the related projects with representatives at the meeting . 1, 1 <-> 2, 2 <-> 3, 3 <-> 4, 4 <-> 5, 4 <-> 21, 5 <-> 7, 6 <-> 8, 8 <-> 14, 9 <-> 17, 9 <-> 32, 10 <-> 18, 12 <-> 15, 14 <-> 16, 16 <-> 38, 17 <-> 39, 18 <-> 40, 19 <-> 24, 19 <-> 41, 20 <-> 26, 20 <-> 27, 21 <-> 28, 21 <-> 29, 21 <-> 30, 21 <-> 31, 23 <-> 33, 24 <-> 34, 24 <-> 35, 25 <-> 36]]]> foreign minister duma expressed his thoughts that the un was born after world war ii , and that france and other permanent member countries were all the victors of that war . the foreign minister feels that the united nations was born out of the second world war , and that france and the other permanent members of the council were victors in that war . 1, 1 <-> 2, 3 <-> 3, 5 <-> 3, 6 <-> 4, 7 <-> 5, 8 <-> 6, 8 <-> 7, 9 <-> 8, 10 <-> 9, 11 <-> 10, 11 <-> 11, 12 <-> 14, 13 <-> 15, 14 <-> 13, 15 <-> 16, 16 <-> 17, 17 <-> 18, 18 <-> 19, 19 <-> 20, 20 <-> 22, 21 <-> 23, 22 <-> 24, 23 <-> 24, 24 <-> 28, 27 <-> 29, 28 <-> 30, 29 <-> 31, 30 <-> 32, 31 <-> 33]]]> moore said the australian military attache to jakarta will conduct free investigations after he arrives in east timor tomorrow . moore said , after the australian military attache to jakarta arrives in east timor tomorrow , he can conduct investigations freely in the area . 0, 1 <-> 1, 2 <-> 4, 3 <-> 5, 4 <-> 6, 5 <-> 7, 5 <-> 16, 6 <-> 8, 7 <-> 9, 8 <-> 17, 8 <-> 18, 9 <-> 17, 9 <-> 18, 10 <-> 20, 11 <-> 19, 14 <-> 10, 15 <-> 11, 16 <-> 12, 16 <-> 23, 17 <-> 13, 17 <-> 23, 18 <-> 14, 19 <-> 24]]]> at that time , jiang zeming indicated that china would consider joining the missile technology control regime . the indication has been taken as the principle result of the meeting between the two state heads . jiang zemin promised at that time that china would consider joining the missile technology control agreement , which was seen as one of the major achievements in the china-us summit meeting . 
3, 1 <-> 4, 2 <-> 5, 4 <-> 0, 5 <-> 1, 6 <-> 2, 7 <-> 6, 8 <-> 7, 9 <-> 8, 10 <-> 9, 11 <-> 10, 12 <-> 11, 13 <-> 12, 14 <-> 13, 15 <-> 14, 16 <-> 15, 17 <-> 16, 18 <-> 17, 19 <-> 17, 20 <-> 18, 20 <-> 19, 21 <-> 18, 21 <-> 19, 22 <-> 18, 22 <-> 19, 23 <-> 20, 24 <-> 21, 24 <-> 23, 25 <-> 24, 26 <-> 25, 27 <-> 26, 28 <-> 27, 29 <-> 29, 29 <-> 30, 30 <-> 28, 31 <-> 28, 32 <-> 28, 33 <-> 28, 34 <-> 29, 35 <-> 31]]]> more than 90% of china 's people centralize on one third of its territory . more than 90 percent of the population is compacted into one-third of the country 's territory . 0, 1 <-> 1, 2 <-> 2, 2 <-> 3, 3 <-> 4, 4 <-> 13, 6 <-> 6, 7 <-> 7, 7 <-> 8, 8 <-> 9, 9 <-> 10, 10 <-> 10, 11 <-> 11, 12 <-> 13, 12 <-> 14, 13 <-> 15, 14 <-> 16]]]> what 's more , next year la nina will be just as bad as el nino . and la nina will put on a frightening display next year no less devastating than that of el nino . 0, 1 <-> 0, 2 <-> 0, 4 <-> 9, 5 <-> 10, 6 <-> 1, 7 <-> 2, 8 <-> 3, 8 <-> 4, 8 <-> 5, 8 <-> 6, 8 <-> 7, 8 <-> 8, 8 <-> 11, 8 <-> 12, 8 <-> 13, 8 <-> 14, 9 <-> 3, 9 <-> 4, 9 <-> 5, 9 <-> 6, 9 <-> 7, 9 <-> 8, 9 <-> 11, 9 <-> 12, 9 <-> 13, 9 <-> 14, 10 <-> 3, 10 <-> 4, 10 <-> 6, 10 <-> 8, 10 <-> 11, 10 <-> 12, 10 <-> 13, 10 <-> 14, 11 <-> 3, 11 <-> 4, 11 <-> 6, 11 <-> 8, 11 <-> 11, 11 <-> 12, 11 <-> 13, 11 <-> 14, 12 <-> 3, 12 <-> 4, 12 <-> 6, 12 <-> 8, 12 <-> 11, 12 <-> 12, 12 <-> 13, 12 <-> 14, 13 <-> 3, 13 <-> 4, 13 <-> 6, 13 <-> 8, 13 <-> 11, 13 <-> 12, 13 <-> 13, 13 <-> 14, 14 <-> 17, 15 <-> 18, 16 <-> 19]]]> russian prime minister on domestic economy russian prime minister talked about russian economic situation . 0, 1 <-> 1, 2 <-> 2, 3 <-> 4, 4 <-> 5, 5 <-> 6, 5 <-> 7]]]> nowadays , there appeared a lot of enterprise groups with high technology and strong stamina . nowadays , there appeared a lot of enterprise groups with high technology and strong stamina . 0, 1 <-> 1, 2 <-> 2, 3 <-> 3, 4 <-> 4, 5 <-> 5, 6 <-> 6, 7 <-> 7, 8 <-> 8, 9 <-> 9, 10 <-> 10, 11 <-> 11, 12 <-> 12, 13 <-> 13, 14 <-> 14, 15 <-> 15]]]> the gnp created by the village and township enterprises occupied about 1\/3 of the total gnp in fujian province . the gross national product of the industry of villages and towns made up 1\/3 of the gnp of fujian province . 0, 1 <-> 1, 1 <-> 2, 1 <-> 3, 3 <-> 4, 4 <-> 5, 5 <-> 8, 6 <-> 9, 7 <-> 10, 8 <-> 6, 9 <-> 11, 9 <-> 12, 11 <-> 13, 12 <-> 14, 13 <-> 15, 15 <-> 16, 16 <-> 17, 17 <-> 18, 18 <-> 19, 19 <-> 20]]]> both parties expressed satisfaction for the friendly cooperation between the two armies in the past 30 years . both parties expressed satisfaction for the friendly cooperation between the two armies in the past 30 years . 0, 1 <-> 1, 2 <-> 2, 3 <-> 3, 4 <-> 4, 5 <-> 5, 6 <-> 6, 7 <-> 7, 8 <-> 8, 9 <-> 9, 10 <-> 10, 11 <-> 11, 12 <-> 12, 13 <-> 13, 14 <-> 14, 15 <-> 15, 16 <-> 16, 17 <-> 17]]]> also present at the seminar will be long yongtu , vice minister of china 's ministry of foreign trade and economic cooperation who will accompany rugerro to shanghai , and shen jueren , former chief negotiator of china in gatt negotiations . attendees will also include the vice minister of foreign trade & economic cooperation , yongtu long , who accompanied ruggiero to shanghai , and former chief representative for trade negotiations of the moftec . 
2, 1 <-> 0, 1 <-> 3, 5 <-> 1, 6 <-> 3, 7 <-> 15, 8 <-> 14, 9 <-> 16, 10 <-> 5, 11 <-> 6, 16 <-> 7, 17 <-> 8, 18 <-> 9, 19 <-> 10, 20 <-> 11, 21 <-> 12, 22 <-> 17, 23 <-> 18, 24 <-> 18, 25 <-> 19, 26 <-> 20, 27 <-> 21, 28 <-> 22, 29 <-> 23, 33 <-> 24, 34 <-> 25, 35 <-> 26, 35 <-> 27, 35 <-> 29, 36 <-> 30, 37 <-> 32, 38 <-> 27, 39 <-> 28, 40 <-> 29, 41 <-> 33]]]> xinhua news agency , nanjing , 16 december , by zhoufang the investment of foreign capital in agriculture of jiangsu increased . xinhua news agency , nanjing , dec. 16 . ( reporter zhou fang ) an increasing number of investments from foreign capital are being made on agriculture in jiangsu . 0, 1 <-> 1, 2 <-> 2, 3 <-> 3, 4 <-> 4, 5 <-> 5, 6 <-> 7, 7 <-> 6, 8 <-> 8, 10 <-> 11, 10 <-> 12, 12 <-> 18, 13 <-> 19, 14 <-> 20, 15 <-> 21, 16 <-> 25, 17 <-> 26, 18 <-> 27, 19 <-> 28, 20 <-> 15, 21 <-> 29]]]> france ministry of foreign affairs said that leaders of iraq refused to co-operate with united nations and have caused this deeply regretted outcome . the french foreign ministry said that because iraqi leader refuses to cooperate with the un caused this sad events . 1, 1 <-> 3, 2 <-> 2, 3 <-> 2, 4 <-> 2, 5 <-> 4, 6 <-> 5, 7 <-> 8, 8 <-> 7, 9 <-> 7, 10 <-> 9, 11 <-> 10, 12 <-> 11, 13 <-> 12, 14 <-> 14, 15 <-> 14, 17 <-> 15, 18 <-> 15, 19 <-> 16, 20 <-> 17, 21 <-> 17, 22 <-> 18, 23 <-> 19]]]> during the preliminaries , lan wei , a highly-skilled twenty-six year-old native of guangdong , scored 355.35 for first place . in the qualifiers , 26-year-old lan wei from guangdong displayed excellent skill , and ranked no. 1 with a total score of 355.3 . 0, 1 <-> 1, 2 <-> 2, 3 <-> 3, 4 <-> 5, 5 <-> 6, 8 <-> 9, 8 <-> 10, 8 <-> 11, 9 <-> 4, 10 <-> 4, 11 <-> 7, 12 <-> 7, 13 <-> 8, 14 <-> 12, 15 <-> 20, 16 <-> 22, 18 <-> 15, 18 <-> 16, 19 <-> 14, 19 <-> 15, 20 <-> 23]]]> nanjing , december 16 ( xinhua ) foreign fund put into jiangsu 's agricultural sector is increasing xinhua news agency , nanjing , dec. 16 ( reporter zhou fang ) - foreign investment in jiangsu 's agriculture is on the rise . 4, 1 <-> 5, 2 <-> 6, 3 <-> 7, 4 <-> 8, 5 <-> 0, 7 <-> 14, 8 <-> 15, 8 <-> 16, 9 <-> 15, 9 <-> 16, 10 <-> 15, 10 <-> 16, 11 <-> 17, 12 <-> 18, 13 <-> 19, 14 <-> 19, 15 <-> 20, 16 <-> 21, 16 <-> 22, 16 <-> 23]]]> someone connected global warming to the phenomenon of el nino . some linked global warming with el nino . 0, 1 <-> 1, 2 <-> 2, 3 <-> 3, 4 <-> 4, 8 <-> 5, 9 <-> 6, 10 <-> 7]]]> xinhua news agency , beijing , january 16th , by xintang xu and yuhong qian- the president of the bank of china , xianglong dai said that , china will continue implementing the financial opening up policy . xinhua news agency , beijing , january 16th ( reporter : xu xingtang , qian yuhong ) . dai xianglong , the president of people 's bank of china , said that china will carry on with the open financial policy . 0, 1 <-> 1, 2 <-> 2, 3 <-> 3, 4 <-> 4, 5 <-> 5, 6 <-> 6, 7 <-> 7, 10 <-> 10, 11 <-> 9, 12 <-> 11, 13 <-> 13, 14 <-> 12, 15 <-> 19, 16 <-> 20, 17 <-> 21, 18 <-> 23, 19 <-> 24, 20 <-> 25, 21 <-> 26, 22 <-> 27, 23 <-> 17, 24 <-> 16, 25 <-> 28, 26 <-> 29, 28 <-> 30, 29 <-> 31, 30 <-> 32, 30 <-> 33, 31 <-> 34, 32 <-> 35, 33 <-> 37, 34 <-> 36, 35 <-> 36, 36 <-> 38, 37 <-> 39]]]> this kind of measure restrained the economic growth , leading to the rise of unemployment . such measures checked economic growth and caused unemployment to rise . 
0, 1 <-> 0, 2 <-> 0, 3 <-> 1, 4 <-> 2, 6 <-> 3, 7 <-> 4, 8 <-> 5, 9 <-> 6, 10 <-> 6, 12 <-> 9, 14 <-> 7, 15 <-> 10]]]> siemens germany is currently cooperating with a local thai company , and constructing another 23km long electric railway project in bangkok . the german shermans company is currently working together with a local company constructing a 23 kilometer electronic train engineering project . 2, 1 <-> 1, 2 <-> 4, 3 <-> 5, 4 <-> 6, 4 <-> 7, 5 <-> 8, 6 <-> 9, 7 <-> 10, 9 <-> 11, 12 <-> 12, 13 <-> 13, 14 <-> 14, 14 <-> 15, 16 <-> 16, 17 <-> 17, 17 <-> 18, 18 <-> 19, 21 <-> 20]]]> he said that the same resolve would lead to the success of the kyoto protocol . he said that the same resolve would lead to the success of the kyoto protocol . 0, 1 <-> 1, 2 <-> 2, 3 <-> 3, 4 <-> 4, 5 <-> 5, 6 <-> 6, 7 <-> 7, 8 <-> 8, 9 <-> 9, 10 <-> 10, 11 <-> 11, 12 <-> 12, 13 <-> 13, 14 <-> 14, 15 <-> 15]]]> however , the official who disclosed the above declined to elaborate what kind of missile technology is being exported and when china provided such technology to pakistan and iran . however , the official was not willing to explain what kind of missile technology that china provided to pakistan and iran , and when this technology was provided . 0, 1 <-> 1, 2 <-> 2, 3 <-> 3, 8 <-> 4, 8 <-> 5, 8 <-> 6, 9 <-> 7, 10 <-> 8, 11 <-> 9, 12 <-> 10, 13 <-> 11, 14 <-> 12, 15 <-> 13, 19 <-> 22, 20 <-> 23, 21 <-> 15, 22 <-> 16, 22 <-> 26, 22 <-> 27, 23 <-> 24, 24 <-> 13, 24 <-> 25, 25 <-> 17, 26 <-> 18, 27 <-> 19, 28 <-> 20, 29 <-> 28]]]> yunnan gardens was developed by fujian company , there are 313 apartments in this residential project . the yunnan gardens project developed by the fujian society is a 313-unit housing project with land . 1, 1 <-> 2, 2 <-> 4, 3 <-> 4, 4 <-> 5, 5 <-> 7, 6 <-> 8, 9 <-> 9, 10 <-> 11, 11 <-> 11, 13 <-> 10, 14 <-> 12, 15 <-> 13, 16 <-> 16]]]> in the last two years , some foreign businessmen showed their interest in the construction of xiling city . during the past two years , a batch of foreign businessmen expressed their wishes to get involved in xining 's city construction one after another . 0, 1 <-> 1, 2 <-> 2, 3 <-> 3, 4 <-> 4, 5 <-> 5, 6 <-> 6, 6 <-> 7, 6 <-> 8, 7 <-> 9, 8 <-> 10, 9 <-> 11, 10 <-> 12, 11 <-> 13, 12 <-> 17, 13 <-> 19, 14 <-> 21, 15 <-> 19, 16 <-> 18, 17 <-> 20, 18 <-> 25]]]> the dai yu xiang industrial consulting company said that spacious front door area is the biggest characteristic of yunnan gardens with land ownership . dai yuxiang real estate consulting firm said that the most special characteristic of the landed residences at yunnan gardens is their spacious appearance . 0, 2 <-> 1, 3 <-> 1, 4 <-> 2, 4 <-> 3, 5 <-> 4, 6 <-> 5, 7 <-> 6, 8 <-> 7, 9 <-> 21, 10 <-> 22, 11 <-> 22, 12 <-> 22, 13 <-> 19, 14 <-> 8, 15 <-> 9, 15 <-> 10, 16 <-> 11, 17 <-> 12, 18 <-> 17, 19 <-> 18, 20 <-> 14, 21 <-> 14, 22 <-> 15, 22 <-> 22, 23 <-> 23]]]> this measure restrained economic growth and raised the rate of unemployment . this curbs economic growth and increases unemployment rates . 0, 2 <-> 1, 3 <-> 2, 4 <-> 3, 5 <-> 4, 6 <-> 5, 8 <-> 7, 10 <-> 6, 11 <-> 8]]]> according to xinhua news agency , london , on february 3rd , bbc reporter bowen stayed in baghdad . the capital of iraq stated that there was no evidence to indicate the bomb-shelter destroyed by a us bomber was a military target . 
according to xinhua news report from london on february 13 , bonne , a reporter of bbc in iraqi capital baghdad , confirmed on 13th that no any sign showed the bomb shelter in baghdad destroyed by american bomber was a military blindage . 0, 1 <-> 1, 2 <-> 2, 3 <-> 3, 6 <-> 6, 8 <-> 7, 9 <-> 8, 10 <-> 9, 11 <-> 10, 12 <-> 15, 12 <-> 16, 13 <-> 14, 14 <-> 11, 16 <-> 17, 17 <-> 20, 17 <-> 34, 20 <-> 19, 21 <-> 18, 22 <-> 18, 23 <-> 22, 24 <-> 25, 26 <-> 26, 27 <-> 26, 28 <-> 28, 30 <-> 29, 31 <-> 30, 32 <-> 31, 32 <-> 32, 33 <-> 35, 34 <-> 36, 36 <-> 37, 37 <-> 38, 38 <-> 39, 39 <-> 40, 40 <-> 41, 41 <-> 42, 42 <-> 43]]]> mr. siazon said , someone used to say , have n't we been burned once before ? when we were ready to accept them , it did n't take long before they fought agaion . siazon said : someone says , were we deceived before ? when we prepared to accept them but just after several days they began to fight again . 0, 1 <-> 0, 2 <-> 1, 3 <-> 2, 4 <-> 3, 5 <-> 4, 6 <-> 4, 7 <-> 4, 8 <-> 5, 9 <-> 6, 9 <-> 8, 11 <-> 7, 12 <-> 6, 12 <-> 8, 13 <-> 6, 13 <-> 8, 15 <-> 9, 16 <-> 10, 17 <-> 11, 18 <-> 12, 19 <-> 13, 20 <-> 13, 21 <-> 14, 22 <-> 15, 23 <-> 16, 24 <-> 17, 25 <-> 18, 25 <-> 19, 25 <-> 20, 25 <-> 21, 26 <-> 18, 26 <-> 19, 26 <-> 20, 26 <-> 21, 27 <-> 18, 27 <-> 19, 27 <-> 20, 27 <-> 21, 28 <-> 18, 28 <-> 19, 28 <-> 20, 28 <-> 21, 29 <-> 18, 29 <-> 19, 29 <-> 20, 29 <-> 21, 30 <-> 18, 30 <-> 19, 30 <-> 20, 30 <-> 21, 31 <-> 22, 32 <-> 23, 32 <-> 24, 32 <-> 25, 33 <-> 26, 34 <-> 27]]]> railroad officials blamed the bus passengers for the accident , the indian news agency india press trust report said . report of pti said that railway official charged the bus passengers upon the accident . 5, 1 <-> 6, 2 <-> 7, 3 <-> 8, 4 <-> 9, 5 <-> 10, 6 <-> 11, 7 <-> 12, 8 <-> 13, 14 <-> 2, 15 <-> 2, 16 <-> 2, 17 <-> 0, 18 <-> 3, 19 <-> 14]]]> we mentioned the problems australia is concerned with , such as human rights and dispatching army officers to east timor . we mentioned the problems that have attracted australia 's attention , such as the humam rights in east timor and the issue of sending military officers to east timor . 0, 1 <-> 1, 2 <-> 2, 3 <-> 3, 4 <-> 7, 5 <-> 5, 5 <-> 6, 5 <-> 8, 5 <-> 9, 6 <-> 5, 6 <-> 6, 6 <-> 8, 6 <-> 9, 7 <-> 5, 7 <-> 6, 7 <-> 8, 7 <-> 9, 8 <-> 10, 9 <-> 11, 10 <-> 12, 11 <-> 14, 12 <-> 15, 13 <-> 19, 14 <-> 23, 15 <-> 24, 16 <-> 25, 17 <-> 26, 18 <-> 27, 19 <-> 17, 19 <-> 28, 20 <-> 18, 20 <-> 29]]]> the two prime ministers requested that un secretary-general prolong the un representative 's stay in cambodia to 6 months or longer . the two prime ministers of cambodia asked the un secretary general to extend the un representative 's term of stay in cambodia to six months or longer . 0, 1 <-> 1, 2 <-> 2, 3 <-> 3, 4 <-> 6, 6 <-> 8, 7 <-> 9, 7 <-> 10, 8 <-> 12, 9 <-> 13, 10 <-> 14, 11 <-> 15, 12 <-> 16, 13 <-> 19, 14 <-> 20, 15 <-> 5, 15 <-> 21, 16 <-> 22, 17 <-> 23, 18 <-> 24, 19 <-> 25, 20 <-> 26, 21 <-> 27]]]> ================================================ FILE: test/paraphrases.xml ================================================ chinese officials have repeatedly indicated that taiwan is a province of china and that china is a domestic chinese issue . 
w19:n:NN:issue w9:n:NN:province w18:n/n:NN:chinese w8:np/n:DT:a w17:n/n:JJ:domestic w7:s[dcl]\np/np:VBZ:be w16:np/n:DT:a w6:n:NN:taiwan w15:s[dcl]\np/np:VBZ:be w14:n:NN:china w4:s[pt]\np/s[em]:VBN:indicate w3:s\np\(s\np):RB:repeatedly w12:s[em]$\(s[em]$)/(s[em]$):CC:and w2:s[dcl]\np/(s[pt]\np):VBP:PERF w11:n:NN:china w1:n:NNS:official w10:np\np/np:IN:of w0:n/n:NN:chinese chinese:S-chinese:P-NN:T-n/n officials:S-official:P-NNS:T-n have:S-have:P-VBP:T-s[dcl]\np/(s[pt]\np) repeatedly:S-repeatedly:P-RB:T-s\np\(s\np) indicated:S-indicate:P-VBN:T-s[pt]\np/s[em] that:S-that:P-IN:T-s[em]/s[dcl] taiwan:S-taiwan:P-NN:T-n is:S-be:P-VBZ:T-s[dcl]\np/np a:S-a:P-DT:T-np/n province:S-province:P-NN:T-n of:S-of:P-IN:T-np\np/np china:S-china:P-NN:T-n and:S-and:P-CC:T-s[em]$\(s[em]$)/(s[em]$) that:S-that:P-DT:T-s[em]/s[dcl] china:S-china:P-NN:T-n is:S-be:P-VBZ:T-s[dcl]\np/np a:S-a:P-DT:T-np/n domestic:S-domestic:P-JJ:T-n/n chinese:S-chinese:P-NN:T-n/n issue:S-issue:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] the chinese government has always been signifying that taiwan is a province of china and taiwan issue is the internal issue of china . w9:s[dcl]\np/np:VBZ:be w19:n/n:JJ:internal w18:np/n:DT:the w8:n:NN:taiwan w17:s[dcl]\np/np:VBZ:be w16:n:NN:issue w6:s[ng]\np/s[em]:VBG:signify w15:n/n:JJ:taiwan w5:s[pt]\np/(s[ng]\np):VBN:PROG w14:s[dcl]$\(s[dcl]$)/(s[dcl]$):CC:and w4:s\np\(s\np):RB:always w13:n:NN:china w3:s[dcl]\np/(s[pt]\np):VBZ:PERF w12:np\np/np:IN:of w2:n:NN:government w11:n:NN:province w1:n/n:JJ:chinese w10:np/n:DT:a w0:np/n:DT:the w22:n:NN:china w21:np\np/np:IN:of w20:n:NN:issue the:S-the:P-DT:T-np/n chinese:S-chinese:P-JJ:T-n/n government:S-government:P-NN:T-n has:S-have:P-VBZ:T-s[dcl]\np/(s[pt]\np) always:S-always:P-RB:T-s\np\(s\np) been:S-be:P-VBN:T-s[pt]\np/(s[ng]\np) signifying:S-signify:P-VBG:T-s[ng]\np/s[em] that:S-that:P-DT:T-s[em]/s[dcl] taiwan:S-taiwan:P-NN:T-n is:S-be:P-VBZ:T-s[dcl]\np/np a:S-a:P-DT:T-np/n province:S-province:P-NN:T-n of:S-of:P-IN:T-np\np/np china:S-china:P-NN:T-n and:S-and:P-CC:T-s[dcl]$\(s[dcl]$)/(s[dcl]$) taiwan:S-taiwan:P-JJ:T-n/n issue:S-issue:P-NN:T-n is:S-be:P-VBZ:T-s[dcl]\np/np the:S-the:P-DT:T-np/n internal:S-internal:P-JJ:T-n/n issue:S-issue:P-NN:T-n of:S-of:P-IN:T-np\np/np china:S-china:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] the government of qinghai province made the best use of the situation , coming up with an idea to commercialize the urban infrastructure construction , and ratified , at the beginning of this year , provisions for xining city to encourage and guide foreign investments . 
w36:s[ng]\np/np:VBG:xining w35:np\np/(s[ng]\np):IN:for w34:n:NNS:provision w33:np\np/np:,:, w32:n:NN:year w31:np/n:DT:this w30:np\np/np:IN:of w29:n:NN:beginning w28:np/n:DT:the w27:s\np\(s\np)/np:IN:at w26:s[dcl]\np:VBD:ratify w25:s[dcl]$\(s[dcl]$)/(s[dcl]$):CC:and w23:n:NN:construction w22:n/n:NN:infrastructure w21:n/n:JJ:urban w20:np/n:DT:the w9:np\np/np:IN:of w8:n:NN:use w7:n/n:JJS:best w6:np/n:DT:the w5:s[dcl]\np/np:VBD:make w4:n:NN:province w3:n/n:NNP:qinghai w19:s[b]\np/np:VB:commercialize w2:np\np/np:IN:of w1:n:NN:government w17:n:NN:idea w0:np/n:DT:the w16:np/n:DT:an w15:pp/np:IN:with w14:s\np\(s\np):RP:up w13:s[ng]\np/pp:VBG:come w11:n:NN:situation w43:n:NNS:investment w10:np/n:DT:the w42:n/n:JJ:foreign w41:s[b]\np/np:VB:guide w40:s[b]$\(s[b]$)/(s[b]$):CC:and w39:s[b]\np/np:VB:encourage w37:n:NN:city the:S-the:P-DT:T-np/n government:S-government:P-NN:T-n of:S-of:P-IN:T-np\np/np qinghai:S-qinghai:P-NNP:T-n/n province:S-province:P-NN:T-n made:S-make:P-VBD:T-s[dcl]\np/np the:S-the:P-DT:T-np/n best:S-best:P-JJS:T-n/n use:S-use:P-NN:T-n of:S-of:P-IN:T-np\np/np the:S-the:P-DT:T-np/n situation:S-situation:P-NN:T-n ,:S-,:P-,:T-s\np\(s\np)/punct[,]/(s\np) coming:S-come:P-VBG:T-s[ng]\np/pp up:S-up:P-RP:T-s\np\(s\np) with:S-with:P-IN:T-pp/np an:S-an:P-DT:T-np/n idea:S-idea:P-NN:T-n to:S-to:P-TO:T-s[to]\np/(s[b]\np) commercialize:S-commercialize:P-VB:T-s[b]\np/np the:S-the:P-DT:T-np/n urban:S-urban:P-JJ:T-n/n infrastructure:S-infrastructure:P-NN:T-n/n construction:S-construction:P-NN:T-n ,:S-,:P-,:T-punct[,] and:S-and:P-CC:T-s[dcl]$\(s[dcl]$)/(s[dcl]$) ratified:S-ratify:P-VBD:T-s[dcl]\np ,:S-,:P-,:T-punct[,] at:S-at:P-IN:T-s\np\(s\np)/np the:S-the:P-DT:T-np/n beginning:S-beginning:P-NN:T-n of:S-of:P-IN:T-np\np/np this:S-this:P-DT:T-np/n year:S-year:P-NN:T-n ,:S-,:P-,:T-np\np/np provisions:S-provision:P-NNS:T-n for:S-for:P-IN:T-np\np/(s[ng]\np) xining:S-xining:P-VBG:T-s[ng]\np/np city:S-city:P-NN:T-n to:S-to:P-TO:T-s[to]\np/(s[b]\np) encourage:S-encourage:P-VB:T-s[b]\np/np and:S-and:P-CC:T-s[b]$\(s[b]$)/(s[b]$) guide:S-guide:P-VB:T-s[b]\np/np foreign:S-foreign:P-JJ:T-n/n investments:S-investment:P-NNS:T-n .:S-.:P-.:T-sent\s[dcl] the government of qinghai province put forward the idea of commercialization of city infrastructure , and approved some regulations on encouraging and attracting foreign investment in xining city early this year . 
w30:n:NN:year w19:np\np/(s[ng]\np):IN:on w9:np\np/np:IN:of w18:n:NNS:regulation w8:n:NN:idea w17:np/n:DT:some w7:np/n:DT:the w16:s[dcl]\np/np:VBD:approve w6:s\np\(s\np):RP:forward w15:s[dcl]$\(s[dcl]$)\punct[,]/(s[dcl]$):CC:and w5:s[dcl]\np/np:VBD:put w4:n:NN:province w13:n:NN:infrastructure w3:n/n:NNP:qinghai w12:n/n:NN:city w2:np\np/np:IN:of w1:n:NN:government w11:np\np/np:IN:of w10:n:NN:commercialization w0:np/n:DT:the w29:s\np\(s\np)/n:DT:this w28:s\np\(s\np)/(s\np\(s\np)):RB:early w27:n:NN:city w26:s[ng]\np/np:VBG:xining w25:np\np/(s[ng]\np):IN:in w24:n:NN:investment w23:n/n:JJ:foreign w22:s[ng]\np/np:VBG:attract w21:s[ng]$\(s[ng]$)/(s[ng]$):CC:and w20:s[ng]\np/np:VBG:encourage the:S-the:P-DT:T-np/n government:S-government:P-NN:T-n of:S-of:P-IN:T-np\np/np qinghai:S-qinghai:P-NNP:T-n/n province:S-province:P-NN:T-n put:S-put:P-VBD:T-s[dcl]\np/np forward:S-forward:P-RP:T-s\np\(s\np) the:S-the:P-DT:T-np/n idea:S-idea:P-NN:T-n of:S-of:P-IN:T-np\np/np commercialization:S-commercialization:P-NN:T-n of:S-of:P-IN:T-np\np/np city:S-city:P-NN:T-n/n infrastructure:S-infrastructure:P-NN:T-n ,:S-,:P-,:T-punct[,] and:S-and:P-CC:T-s[dcl]$\(s[dcl]$)\punct[,]/(s[dcl]$) approved:S-approve:P-VBD:T-s[dcl]\np/np some:S-some:P-DT:T-np/n regulations:S-regulation:P-NNS:T-n on:S-on:P-IN:T-np\np/(s[ng]\np) encouraging:S-encourage:P-VBG:T-s[ng]\np/np and:S-and:P-CC:T-s[ng]$\(s[ng]$)/(s[ng]$) attracting:S-attract:P-VBG:T-s[ng]\np/np foreign:S-foreign:P-JJ:T-n/n investment:S-investment:P-NN:T-n in:S-in:P-IN:T-np\np/(s[ng]\np) xining:S-xining:P-VBG:T-s[ng]\np/np city:S-city:P-NN:T-n early:S-early:P-RB:T-s\np\(s\np)/(s\np\(s\np)) this:S-this:P-DT:T-s\np\(s\np)/n year:S-year:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] relevant sections of the henan government released their foreign cooperation projects concerning economy and technology . representatives attending the meeting consulted on information of some projects they interested in. w19:s[dcl]\np/np/pp:VBD:consulted w9:n/n:NN:cooperation w18:n:NN:meeting w8:n/n:JJ:foreign w17:np/n:DT:the w7:np/n:PRP$:their w6:s[dcl]\np/np:VBD:release w16:s[ng]\np/np:VBG:attend w15:n:NNS:representative w5:n:NN:government w14:n:NN:technology w4:n/n:JJ:henan w13:n\n/n:CC:and w3:np/n:DT:the w12:n:NN:economy w2:np\np/np:IN:of w11:n/n:VBG:concern w1:n:NNS:section w10:n/n:NNS:project w0:n/n:JJ:relevant w27:s[adj]\np\(s[adj]\np):NN:in. w26:s[adj]\np:JJ:interested w25:np:PRP:they w24:n:NNS:project w23:np/n:DT:some w22:np\np/np:IN:of w21:n:NN:information w20:pp/np:IN:on relevant:S-relevant:P-JJ:T-n/n sections:S-section:P-NNS:T-n of:S-of:P-IN:T-np\np/np the:S-the:P-DT:T-np/n henan:S-henan:P-JJ:T-n/n government:S-government:P-NN:T-n released:S-release:P-VBD:T-s[dcl]\np/np their:S-their:P-PRP$:T-np/n foreign:S-foreign:P-JJ:T-n/n cooperation:S-cooperation:P-NN:T-n/n projects:S-project:P-NNS:T-n/n concerning:S-concern:P-VBG:T-n/n economy:S-economy:P-NN:T-n and:S-and:P-CC:T-n\n/n technology:S-technology:P-NN:T-n .:S-.:P-.:T-punct[.] 
representatives:S-representative:P-NNS:T-n attending:S-attend:P-VBG:T-s[ng]\np/np the:S-the:P-DT:T-np/n meeting:S-meeting:P-NN:T-n consulted:S-consulted:P-VBD:T-s[dcl]\np/np/pp on:S-on:P-IN:T-pp/np information:S-information:P-NN:T-n of:S-of:P-IN:T-np\np/np some:S-some:P-DT:T-np/n projects:S-project:P-NNS:T-n they:S-they:P-PRP:T-np interested:S-interested:P-JJ:T-s[adj]\np in.:S-in.:P-NN:T-s[adj]\np\(s[adj]\np) the competent agencies of the henan provincial government released [ a list of ] foreign economic technological cooperation projects of the province at the meeting and held discussions regarding the purpose of cooperation in the related projects with representatives at the meeting . w36:n:NNS:project w35:n/n:JJ:related w34:np/n:DT:the w33:np\np/np:IN:in w32:n:NN:cooperation w31:np\np/np:IN:of w30:n:NN:purpose w29:np/n:DT:the w28:s[ng]\np/np:VBG:regard w27:n:NNS:discussion w26:s[dcl]\np/np:VBD:hold w25:s[dcl]$\(s[dcl]$)/(s[dcl]$):CC:and w24:n:NN:meeting w23:np/n:DT:the w22:s\np\(s\np)/np:IN:at w21:n:NN:province w20:np/n:DT:the w9:s\np\(s\np)/np:IN:lsb w8:s[dcl]\np/np:VBD:release w7:n:NN:government w6:n/n:JJ:provincial w5:n/n:JJ:henan w4:np/n:DT:the w3:np\np/np:IN:of w19:np\np/np:IN:of w2:n:NNS:agency w18:n:NNS:project w1:n/n:JJ:competent w17:n/n:NN:cooperation w0:np/n:DT:the w16:n/n:JJ:technological w15:n/n:JJ:economic w14:n/n:JJ:foreign w13:n/n:JJ:rsb w12:np\np/np:IN:of w11:n:NN:list w10:np/n:DT:a w41:n:NN:meeting w40:np/n:DT:the w39:s\np\(s\np)/np:IN:at w38:n:NNS:representative w37:np\np/np:IN:with the:S-the:P-DT:T-np/n competent:S-competent:P-JJ:T-n/n agencies:S-agency:P-NNS:T-n of:S-of:P-IN:T-np\np/np the:S-the:P-DT:T-np/n henan:S-henan:P-JJ:T-n/n provincial:S-provincial:P-JJ:T-n/n government:S-government:P-NN:T-n released:S-release:P-VBD:T-s[dcl]\np/np [:S-[:P-IN:T-s\np\(s\np)/np a:S-a:P-DT:T-np/n list:S-list:P-NN:T-n of:S-of:P-IN:T-np\np/np ]:S-]:P-JJ:T-n/n foreign:S-foreign:P-JJ:T-n/n economic:S-economic:P-JJ:T-n/n technological:S-technological:P-JJ:T-n/n cooperation:S-cooperation:P-NN:T-n/n projects:S-project:P-NNS:T-n of:S-of:P-IN:T-np\np/np the:S-the:P-DT:T-np/n province:S-province:P-NN:T-n at:S-at:P-IN:T-s\np\(s\np)/np the:S-the:P-DT:T-np/n meeting:S-meeting:P-NN:T-n and:S-and:P-CC:T-s[dcl]$\(s[dcl]$)/(s[dcl]$) held:S-hold:P-VBD:T-s[dcl]\np/np discussions:S-discussion:P-NNS:T-n regarding:S-regard:P-VBG:T-s[ng]\np/np the:S-the:P-DT:T-np/n purpose:S-purpose:P-NN:T-n of:S-of:P-IN:T-np\np/np cooperation:S-cooperation:P-NN:T-n in:S-in:P-IN:T-np\np/np the:S-the:P-DT:T-np/n related:S-related:P-JJ:T-n/n projects:S-project:P-NNS:T-n with:S-with:P-IN:T-np\np/np representatives:S-representative:P-NNS:T-n at:S-at:P-IN:T-s\np\(s\np)/np the:S-the:P-DT:T-np/n meeting:S-meeting:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] foreign minister duma expressed his thoughts that the un was born after world war ii , and that france and other permanent member countries were all the victors of that war . 
w30:n:NN:war w9:s[dcl]\np/(s[pss]\np):VBD:PASS w19:n\(n/n)/n:CC:and w8:n:NN:un w18:n/n:NN:france w7:np/n:DT:the h1:n\(n/n)/n:CC:has-rel w16:s[em]$\(s[em]$)\punct[,]/(s[em]$):CC:and w5:n/s[em]:NNS:thought w14:n:NNS:ii w4:np/n:PRP$:his w3:s[dcl]\np/np:VBD:express w13:n/n:NN:war w12:n/n:NN:world w2:n:NN:duma w11:s\np\(s\np)/np:IN:after w1:n/n:NN:minister w10:s[pss]\np:VBN:bear w0:n/n:JJ:foreign w29:np/n:DT:that w28:np\np/np:IN:of w27:n:NNS:victors w26:np/n:DT:the w25:np/np:PDT:all w24:s[dcl]\np/np:VBD:be w23:n:NNS:country w22:n/n:NN:member w21:n/n:JJ:permanent w20:n/n:JJ:other foreign:S-foreign:P-JJ:T-n/n minister:S-minister:P-NN:T-n/n duma:S-duma:P-NN:T-n expressed:S-express:P-VBD:T-s[dcl]\np/np his:S-his:P-PRP$:T-np/n thoughts:S-thought:P-NNS:T-n/s[em] that:S-that:P-IN:T-s[em]/s[dcl] the:S-the:P-DT:T-np/n un:S-un:P-NN:T-n was:S-be:P-VBD:T-s[dcl]\np/(s[pss]\np) born:S-bear:P-VBN:T-s[pss]\np after:S-after:P-IN:T-s\np\(s\np)/np world:S-world:P-NN:T-n/n war:S-war:P-NN:T-n/n ii:S-ii:P-NNS:T-n ,:S-,:P-,:T-punct[,] and:S-and:P-CC:T-s[em]$\(s[em]$)\punct[,]/(s[em]$) that:S-that:P-DT:T-s[em]/s[dcl] france:S-france:P-NN:T-n/n and:S-and:P-CC:T-n\(n/n)/n other:S-other:P-JJ:T-n/n permanent:S-permanent:P-JJ:T-n/n member:S-member:P-NN:T-n/n countries:S-country:P-NNS:T-n were:S-be:P-VBD:T-s[dcl]\np/np all:S-all:P-PDT:T-np/np the:S-the:P-DT:T-np/n victors:S-victors:P-NNS:T-n of:S-of:P-IN:T-np\np/np that:S-that:P-DT:T-np/n war:S-war:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] the foreign minister feels that the united nations was born out of the second world war , and that france and the other permanent members of the council were victors in that war . w32:n:NN:war w31:np/n:DT:that w30:s\np\(s\np)/np:IN:in w9:s[pss]\np:VBN:bear w19:n:NN:france w8:s[dcl]\np/(s[pss]\np):VBD:PASS w17:s[em]$\(s[em]$)\punct[,]/(s[em]$):CC:and w7:n:NNS:nation w6:n/n:JJ:united w15:n:NN:war w5:np/n:DT:the w14:n/n:NN:world w3:s[dcl]\np/s[em]:VBZ:feel w13:n/n:JJ:second w2:n:NN:minister w12:np/n:DT:the w11:pp/np:IN:of w1:n/n:JJ:foreign w10:s\np\(s\np)/pp:IN:out w0:np/n:DT:the w29:n:NNS:victors w28:s[dcl]\np/np:VBD:be w27:n:NN:council w26:np/n:DT:the w25:np\np/np:IN:of w24:n:NNS:member w23:n/n:JJ:permanent w22:n/n:JJ:other w21:np/n:DT:the w20:np\np/np:CC:and the:S-the:P-DT:T-np/n foreign:S-foreign:P-JJ:T-n/n minister:S-minister:P-NN:T-n feels:S-feel:P-VBZ:T-s[dcl]\np/s[em] that:S-that:P-IN:T-s[em]/s[dcl] the:S-the:P-DT:T-np/n united:S-united:P-JJ:T-n/n nations:S-nation:P-NNS:T-n was:S-be:P-VBD:T-s[dcl]\np/(s[pss]\np) born:S-bear:P-VBN:T-s[pss]\np out:S-out:P-IN:T-s\np\(s\np)/pp of:S-of:P-IN:T-pp/np the:S-the:P-DT:T-np/n second:S-second:P-JJ:T-n/n world:S-world:P-NN:T-n/n war:S-war:P-NN:T-n ,:S-,:P-,:T-punct[,] and:S-and:P-CC:T-s[em]$\(s[em]$)\punct[,]/(s[em]$) that:S-that:P-DT:T-s[em]/s[dcl] france:S-france:P-NN:T-n and:S-and:P-CC:T-np\np/np the:S-the:P-DT:T-np/n other:S-other:P-JJ:T-n/n permanent:S-permanent:P-JJ:T-n/n members:S-member:P-NNS:T-n of:S-of:P-IN:T-np\np/np the:S-the:P-DT:T-np/n council:S-council:P-NN:T-n were:S-be:P-VBD:T-s[dcl]\np/np victors:S-victors:P-NNS:T-n in:S-in:P-IN:T-s\np\(s\np)/np that:S-that:P-DT:T-np/n war:S-war:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] moore said the australian military attache to jakarta will conduct free investigations after he arrives in east timor tomorrow . 
w9:s[b]\np/np:VB:conduct w18:s\np\(s\np):NN:tomorrow w8:s[dcl]\np/(s[b]\np):MD:will w17:n:NN:timor w7:n:NNP:jakarta w16:n/n:JJ:east w6:np\np/np:TO:to w15:s\np\(s\np)/np:IN:in w5:n:NN:attache w14:s[dcl]\np:VBZ:arrive w4:n/n:JJ:military w13:np:PRP:he w3:n/n:JJ:australian w12:s\np\(s\np)/s[dcl]:IN:after w2:np/n:DT:the w11:n:NNS:investigation w1:s[dcl]\np/s[dcl]:VBD:say w10:n/n:JJ:free w0:n:NN:moore moore:S-moore:P-NN:T-n said:S-say:P-VBD:T-s[dcl]\np/s[dcl] the:S-the:P-DT:T-np/n australian:S-australian:P-JJ:T-n/n military:S-military:P-JJ:T-n/n attache:S-attache:P-NN:T-n to:S-to:P-TO:T-np\np/np jakarta:S-jakarta:P-NNP:T-n will:S-will:P-MD:T-s[dcl]\np/(s[b]\np) conduct:S-conduct:P-VB:T-s[b]\np/np free:S-free:P-JJ:T-n/n investigations:S-investigation:P-NNS:T-n after:S-after:P-IN:T-s\np\(s\np)/s[dcl] he:S-he:P-PRP:T-np arrives:S-arrive:P-VBZ:T-s[dcl]\np in:S-in:P-IN:T-s\np\(s\np)/np east:S-east:P-JJ:T-n/n timor:S-timor:P-NN:T-n tomorrow:S-tomorrow:P-NN:T-s\np\(s\np) .:S-.:P-.:T-sent\s[dcl] moore said , after the australian military attache to jakarta arrives in east timor tomorrow , he can conduct investigations freely in the area . w19:n:NNS:investigation w9:n:NN:jakarta w18:s[b]\np/np:VB:conduct w8:np\np/np:TO:to w7:n:NN:attache w17:s[dcl]\np/(s[b]\np):MD:can w16:np:PRP:he w6:n/n:JJ:military w5:n/n:JJ:australian w14:s\np\(s\np):NN:tomorrow w4:np/n:DT:the w13:n:NN:timor w3:s/s/s[dcl]:IN:after w12:n/n:JJ:east w11:s\np\(s\np)/np:IN:in w1:s[dcl]\np/s[dcl]/punct[,]:VBD:say w10:s[dcl]\np:VBZ:arrive w0:n:NN:moore w23:n:NN:area w22:np/n:DT:the w21:s\np\(s\np)/np:IN:in w20:s\np\(s\np):RB:freely moore:S-moore:P-NN:T-n said:S-say:P-VBD:T-s[dcl]\np/s[dcl]/punct[,] ,:S-,:P-,:T-punct[,] after:S-after:P-IN:T-s/s/s[dcl] the:S-the:P-DT:T-np/n australian:S-australian:P-JJ:T-n/n military:S-military:P-JJ:T-n/n attache:S-attache:P-NN:T-n to:S-to:P-TO:T-np\np/np jakarta:S-jakarta:P-NN:T-n arrives:S-arrive:P-VBZ:T-s[dcl]\np in:S-in:P-IN:T-s\np\(s\np)/np east:S-east:P-JJ:T-n/n timor:S-timor:P-NN:T-n tomorrow:S-tomorrow:P-NN:T-s\np\(s\np) ,:S-,:P-,:T-s/s\(s/s) he:S-he:P-PRP:T-np can:S-can:P-MD:T-s[dcl]\np/(s[b]\np) conduct:S-conduct:P-VB:T-s[b]\np/np investigations:S-investigation:P-NNS:T-n freely:S-freely:P-RB:T-s\np\(s\np) in:S-in:P-IN:T-s\np\(s\np)/np the:S-the:P-DT:T-np/n area:S-area:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] at that time , jiang zeming indicated that china would consider joining the missile technology control regime . the indication has been taken as the principle result of the meeting between the two state heads . 
w33:n:NNS:head w32:n/n:NN:state w31:n/n:CD:two w30:np/n:DT:the w9:s[dcl]\np/(s[b]\np):MD:would w19:s[dcl]\np/(s[pt]\np):VBZ:PERF w18:n:NN:indication w8:n:NN:china w17:np/n:DT:the w6:s[dcl]\np/s[em]:VBD:indicate w16:n:NN:regime w5:n:VBG:zeming w15:n/n:NN:control w14:n/n:NN:technology w4:n/n:VBG:jiang w13:n/n:NN:missile w2:n:NN:time w12:np/n:DT:the w11:s[ng]\np/np:VBG:join w1:np/n:DT:that w10:s[b]\np/np:VB:consider w0:s/s/np:IN:at w29:np\np/np:IN:between w28:n:NN:meeting w27:np/n:DT:the w26:np\np/np:IN:of w25:n:NN:result w24:n:NN:principle w23:np/n:DT:the w22:pp/np:IN:as w21:s[pss]\np/pp:VBN:take w20:s[pt]\np/(s[pss]\np):VBN:PASS at:S-at:P-IN:T-s/s/np that:S-that:P-DT:T-np/n time:S-time:P-NN:T-n ,:S-,:P-,:T-s/s\(s/s) jiang:S-jiang:P-VBG:T-n/n zeming:S-zeming:P-VBG:T-n indicated:S-indicate:P-VBD:T-s[dcl]\np/s[em] that:S-that:P-IN:T-s[em]/s[dcl] china:S-china:P-NN:T-n would:S-would:P-MD:T-s[dcl]\np/(s[b]\np) consider:S-consider:P-VB:T-s[b]\np/np joining:S-join:P-VBG:T-s[ng]\np/np the:S-the:P-DT:T-np/n missile:S-missile:P-NN:T-n/n technology:S-technology:P-NN:T-n/n control:S-control:P-NN:T-n/n regime:S-regime:P-NN:T-n .:S-.:P-.:T-punct[.] the:S-the:P-DT:T-np/n indication:S-indication:P-NN:T-n has:S-have:P-VBZ:T-s[dcl]\np/(s[pt]\np) been:S-be:P-VBN:T-s[pt]\np/(s[pss]\np) taken:S-take:P-VBN:T-s[pss]\np/pp as:S-as:P-IN:T-pp/np the:S-the:P-DT:T-np/n principle:S-principle:P-NN:T-n result:S-result:P-NN:T-n of:S-of:P-IN:T-np\np/np the:S-the:P-DT:T-np/n meeting:S-meeting:P-NN:T-n between:S-between:P-IN:T-np\np/np the:S-the:P-DT:T-np/n two:S-two:P-CD:T-n/n state:S-state:P-NN:T-n/n heads:S-head:P-NNS:T-n .:S-.:P-.:T-sent\s[dcl] jiang zemin promised at that time that china would consider joining the missile technology control agreement , which was seen as one of the major achievements in the china-us summit meeting . w30:n:NN:meeting w19:s[pss]\np/pp:VBN:see w9:s[b]\np/(s[ng]\np):VB:consider w18:s[dcl]\np/(s[pss]\np):VBD:PASS w8:s[dcl]\np/(s[b]\np):MD:would w7:n:NN:china w15:n:NN:agreement w5:n:NN:time w14:n/n:NN:control w4:np/n:DT:that w13:n/n:NN:technology w3:s\np\(s\np)/np:IN:at w2:s[dcl]\np/np:VBD:promise w12:n/n:NN:missile w11:np/n:DT:the w1:n:NNP:zemin w10:s[ng]\np/np:VBG:join w0:n/n:NNP:jiang w29:n/n:NN:summit w28:n/n:JJ:china-us w27:np/n:DT:the w26:np\np/np:IN:in w25:n:NNS:achievement w24:n/n:JJ:major w23:np/n:DT:the w22:np\np/np:IN:of w21:n:CD:one w20:pp/np:IN:as jiang:S-jiang:P-NNP:T-n/n zemin:S-zemin:P-NNP:T-n promised:S-promise:P-VBD:T-s[dcl]\np/np at:S-at:P-IN:T-s\np\(s\np)/np that:S-that:P-DT:T-np/n time:S-time:P-NN:T-n that:S-that:P-IN:T-np\np/(s[dcl]/np) china:S-china:P-NN:T-n would:S-would:P-MD:T-s[dcl]\np/(s[b]\np) consider:S-consider:P-VB:T-s[b]\np/(s[ng]\np) joining:S-join:P-VBG:T-s[ng]\np/np the:S-the:P-DT:T-np/n missile:S-missile:P-NN:T-n/n technology:S-technology:P-NN:T-n/n control:S-control:P-NN:T-n/n agreement:S-agreement:P-NN:T-n ,:S-,:P-,:T-punct[,] which:S-which:P-WDT:T-np\np\punct[,]/(s[dcl]\np) was:S-be:P-VBD:T-s[dcl]\np/(s[pss]\np) seen:S-see:P-VBN:T-s[pss]\np/pp as:S-as:P-IN:T-pp/np one:S-one:P-CD:T-n of:S-of:P-IN:T-np\np/np the:S-the:P-DT:T-np/n major:S-major:P-JJ:T-n/n achievements:S-achievement:P-NNS:T-n in:S-in:P-IN:T-np\np/np the:S-the:P-DT:T-np/n china-us:S-china-us:P-JJ:T-n/n summit:S-summit:P-NN:T-n/n meeting:S-meeting:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] more than 90% of china 's people centralize on one third of its territory . 
w9:n/n:CD:one w8:pp/np:IN:on w7:s[dcl]\np/pp:VBP:centralize w6:n:NNS:people w4:n:NN:china w3:np\np/np:IN:of w2:n:CD:90% w1:n/n\(s[adj]\np):IN:than w0:s[adj]\np:JJR:more w13:n:NN:territory w12:np/n:PRP$:its w11:np\np/np:IN:of w10:n:NN:third more:S-more:P-JJR:T-s[adj]\np than:S-than:P-IN:T-n/n\(s[adj]\np) 90%:S-90%:P-CD:T-n of:S-of:P-IN:T-np\np/np china:S-china:P-NN:T-n 's:S-'s:P-POS:T-np/n\np people:S-people:P-NNS:T-n centralize:S-centralize:P-VBP:T-s[dcl]\np/pp on:S-on:P-IN:T-pp/np one:S-one:P-CD:T-n/n third:S-third:P-NN:T-n of:S-of:P-IN:T-np\np/np its:S-its:P-PRP$:T-np/n territory:S-territory:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] more than 90 percent of the population is compacted into one-third of the country 's territory . w9:pp/np:IN:into w8:s[pss]\np/pp:VBN:compact w7:s[dcl]\np/(s[pss]\np):VBZ:PASS w6:n:NN:population w5:np/n:DT:the w4:np\np/np:IN:of w3:n:NN:percent w2:n/n:CD:90 w1:n/n/(n/n)\(s[adj]\np):IN:than w15:n:NN:territory w0:s[adj]\np:JJR:more w13:n:NN:country w12:np/n:DT:the w11:np\np/np:IN:of w10:n:NN:one-third more:S-more:P-JJR:T-s[adj]\np than:S-than:P-IN:T-n/n/(n/n)\(s[adj]\np) 90:S-90:P-CD:T-n/n percent:S-percent:P-NN:T-n of:S-of:P-IN:T-np\np/np the:S-the:P-DT:T-np/n population:S-population:P-NN:T-n is:S-be:P-VBZ:T-s[dcl]\np/(s[pss]\np) compacted:S-compact:P-VBN:T-s[pss]\np/pp into:S-into:P-IN:T-pp/np one-third:S-one-third:P-NN:T-n of:S-of:P-IN:T-np\np/np the:S-the:P-DT:T-np/n country:S-country:P-NN:T-n 's:S-'s:P-POS:T-np/n\np territory:S-territory:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] what 's more , next year la nina will be just as bad as el nino . w9:s[b]\np/(s[adj]\np):VB:be w8:s[dcl]\np/(s[b]\np):MD:will w7:n:NN:nina w6:np/n:DT:la w5:s/s:NN:year w4:s/s/(s/s):JJ:next w2:n:JJR:more w1:s[dcl]\np/np:VBZ:be w15:n:NN:nino w14:n/n:JJ:el w13:s[adj]\np\(s[adj]\np)/np:IN:as w12:s[adj]\np:JJ:bad w11:s[adj]\np/(s[adj]\np):RB:as w10:s[adj]\np/(s[adj]\np):RB:just what:S-what:P-WP:T-np/(s[dcl]\np) 's:S-be:P-VBZ:T-s[dcl]\np/np more:S-more:P-JJR:T-n ,:S-,:P-,:T-s/s\np next:S-next:P-JJ:T-s/s/(s/s) year:S-year:P-NN:T-s/s la:S-la:P-DT:T-np/n nina:S-nina:P-NN:T-n will:S-will:P-MD:T-s[dcl]\np/(s[b]\np) be:S-be:P-VB:T-s[b]\np/(s[adj]\np) just:S-just:P-RB:T-s[adj]\np/(s[adj]\np) as:S-as:P-RB:T-s[adj]\np/(s[adj]\np) bad:S-bad:P-JJ:T-s[adj]\np as:S-as:P-IN:T-s[adj]\np\(s[adj]\np)/np el:S-el:P-JJ:T-n/n nino:S-nino:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] and la nina will put on a frightening display next year no less devastating than that of el nino . 
w9:np\np/(np\np):JJ:next w18:n:NN:nino w8:n:NN:display w17:n/n:JJ:el w7:n/n:JJ:frightening w16:np\np/np:IN:of w6:np/n:DT:a w15:np:DT:that w5:pp/np:IN:on w14:s[adj]\np\(s[adj]\np)/np:IN:than w4:s[b]\np/pp:VB:put w13:s[adj]\np:JJ:devastating w3:s[dcl]\np/(s[b]\np):MD:will w12:s[adj]\np/(s[adj]\np):RBR:less w2:n:NN:nina w11:s[adj]\np/(s[adj]\np):RB:no w1:np/n:DT:la w10:np\np:NN:year w0:s/s:CC:and and:S-and:P-CC:T-s/s la:S-la:P-DT:T-np/n nina:S-nina:P-NN:T-n will:S-will:P-MD:T-s[dcl]\np/(s[b]\np) put:S-put:P-VB:T-s[b]\np/pp on:S-on:P-IN:T-pp/np a:S-a:P-DT:T-np/n frightening:S-frightening:P-JJ:T-n/n display:S-display:P-NN:T-n next:S-next:P-JJ:T-np\np/(np\np) year:S-year:P-NN:T-np\np no:S-no:P-RB:T-s[adj]\np/(s[adj]\np) less:S-less:P-RBR:T-s[adj]\np/(s[adj]\np) devastating:S-devastating:P-JJ:T-s[adj]\np than:S-than:P-IN:T-s[adj]\np\(s[adj]\np)/np that:S-that:P-DT:T-np of:S-of:P-IN:T-np\np/np el:S-el:P-JJ:T-n/n nino:S-nino:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] russian prime minister on domestic economy w2:n:NN:minister w1:n/n:JJ:prime w0:n/n:JJ:russian w5:n:NN:economy w4:n/n:JJ:domestic w3:np\np/np:IN:on russian:S-russian:P-JJ:T-n/n prime:S-prime:P-JJ:T-n/n minister:S-minister:P-NN:T-n on:S-on:P-IN:T-np\np/np domestic:S-domestic:P-JJ:T-n/n economy:S-economy:P-NN:T-n russian prime minister talked about russian economic situation . w2:n:NN:minister w1:n/n:JJ:prime w0:n/n:JJ:russian w7:n:NN:situation w6:n/n:JJ:economic w5:n/n:JJ:russian w4:pp/np:IN:about w3:s[dcl]\np/pp:VBD:talk russian:S-russian:P-JJ:T-n/n prime:S-prime:P-JJ:T-n/n minister:S-minister:P-NN:T-n talked:S-talk:P-VBD:T-s[dcl]\np/pp about:S-about:P-IN:T-pp/np russian:S-russian:P-JJ:T-n/n economic:S-economic:P-JJ:T-n/n situation:S-situation:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] nowadays , there appeared a lot of enterprise groups with high technology and strong stamina . w9:np\np/np:IN:with w8:n:NNS:group w7:n/n:NN:enterprise w6:s\np\(s\np)\(s\np\(s\np))/np:IN:of w5:n:NN:lot w4:s\np\(s\np)/n:DT:a w3:s[dcl]\np:VBD:appear w0:s/s:RB:nowadays w14:n:NN:stamina w13:n/n:JJ:strong w12:n\n/n:CC:and w11:n:NN:technology w10:n/n:JJ:high nowadays:S-nowadays:P-RB:T-s/s ,:S-,:P-,:T-s/s\(s/s) there:S-there:P-EX:T-np[thr] appeared:S-appear:P-VBD:T-s[dcl]\np a:S-a:P-DT:T-s\np\(s\np)/n lot:S-lot:P-NN:T-n of:S-of:P-IN:T-s\np\(s\np)\(s\np\(s\np))/np enterprise:S-enterprise:P-NN:T-n/n groups:S-group:P-NNS:T-n with:S-with:P-IN:T-np\np/np high:S-high:P-JJ:T-n/n technology:S-technology:P-NN:T-n and:S-and:P-CC:T-n\n/n strong:S-strong:P-JJ:T-n/n stamina:S-stamina:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] nowadays , there appeared a lot of enterprise groups with high technology and strong stamina . w9:np\np/np:IN:with w8:n:NNS:group w7:n/n:NN:enterprise w6:s\np\(s\np)\(s\np\(s\np))/np:IN:of w5:n:NN:lot w4:s\np\(s\np)/n:DT:a w3:s[dcl]\np:VBD:appear w0:s/s:RB:nowadays w14:n:NN:stamina w13:n/n:JJ:strong w12:n\n/n:CC:and w11:n:NN:technology w10:n/n:JJ:high nowadays:S-nowadays:P-RB:T-s/s ,:S-,:P-,:T-s/s\(s/s) there:S-there:P-EX:T-np[thr] appeared:S-appear:P-VBD:T-s[dcl]\np a:S-a:P-DT:T-s\np\(s\np)/n lot:S-lot:P-NN:T-n of:S-of:P-IN:T-s\np\(s\np)\(s\np\(s\np))/np enterprise:S-enterprise:P-NN:T-n/n groups:S-group:P-NNS:T-n with:S-with:P-IN:T-np\np/np high:S-high:P-JJ:T-n/n technology:S-technology:P-NN:T-n and:S-and:P-CC:T-n\n/n strong:S-strong:P-JJ:T-n/n stamina:S-stamina:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] the gnp created by the village and township enterprises occupied about 1\/3 of the total gnp in fujian province . 
w9:s[dcl]\np/np:VBD:occupy w8:n:NNS:enterprise w18:n:NN:province w17:n/n:JJ:fujian w7:n/n:NN:township h1:n\(n/n)/n:CC:has-rel w16:np\np/np:IN:in w6:n\(n/n)/n:CC:and w15:n:NN:gnp w5:n/n:NN:village w14:n/n:JJ:total w4:np/n:DT:the w13:np/n:DT:the w3:s\np\(s\np)/np:IN:by w12:np\np/np:IN:of w2:s[pss]\np:VBN:create w11:n:CD:1\/3 w1:n:NN:gnp w10:n/n:IN:about w0:np/n:DT:the the:S-the:P-DT:T-np/n gnp:S-gnp:P-NN:T-n created:S-create:P-VBN:T-s[pss]\np by:S-by:P-IN:T-s\np\(s\np)/np the:S-the:P-DT:T-np/n village:S-village:P-NN:T-n/n and:S-and:P-CC:T-n\(n/n)/n township:S-township:P-NN:T-n/n enterprises:S-enterprise:P-NNS:T-n occupied:S-occupy:P-VBD:T-s[dcl]\np/np about:S-about:P-IN:T-n/n 1\/3:S-1\/3:P-CD:T-n of:S-of:P-IN:T-np\np/np the:S-the:P-DT:T-np/n total:S-total:P-JJ:T-n/n gnp:S-gnp:P-NN:T-n in:S-in:P-IN:T-np\np/np fujian:S-fujian:P-JJ:T-n/n province:S-province:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] the gross national product of the industry of villages and towns made up 1\/3 of the gnp of fujian province . w9:np\np/np:CC:and w19:n:NN:province w18:n/n:JJ:fujian w8:n:NNS:village w17:np\np/np:IN:of w7:np\np/np:IN:of w16:n:NN:gnp w6:n:NN:industry w15:np/n:DT:the w5:np/n:DT:the w14:np\np/np:IN:of w4:np\np/np:IN:of w13:n:CD:1\/3 w3:n:NN:product w12:s\np\(s\np):RP:up w2:n/n:JJ:national w11:s[dcl]\np/np:VBD:make w1:n/n:JJ:gross w10:n:NNS:town w0:np/n:DT:the the:S-the:P-DT:T-np/n gross:S-gross:P-JJ:T-n/n national:S-national:P-JJ:T-n/n product:S-product:P-NN:T-n of:S-of:P-IN:T-np\np/np the:S-the:P-DT:T-np/n industry:S-industry:P-NN:T-n of:S-of:P-IN:T-np\np/np villages:S-village:P-NNS:T-n and:S-and:P-CC:T-np\np/np towns:S-town:P-NNS:T-n made:S-make:P-VBD:T-s[dcl]\np/np up:S-up:P-RP:T-s\np\(s\np) 1\/3:S-1\/3:P-CD:T-n of:S-of:P-IN:T-np\np/np the:S-the:P-DT:T-np/n gnp:S-gnp:P-NN:T-n of:S-of:P-IN:T-np\np/np fujian:S-fujian:P-JJ:T-n/n province:S-province:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] both parties expressed satisfaction for the friendly cooperation between the two armies in the past 30 years . w9:np/n:DT:the w8:np\np/np:IN:between w7:n:NN:cooperation w6:n/n:JJ:friendly w5:np/n:DT:the w4:np\np/np:IN:for w3:n:NN:satisfaction w2:s[dcl]\np/np:VBD:express w16:n:NNS:year w1:n:NNS:party w15:n/n:CD:30 w0:np/n:DT:both w14:n/n:JJ:past w13:np/n:DT:the w12:np\np/np:IN:in w11:n:NNS:army w10:n/n:CD:two both:S-both:P-DT:T-np/n parties:S-party:P-NNS:T-n expressed:S-express:P-VBD:T-s[dcl]\np/np satisfaction:S-satisfaction:P-NN:T-n for:S-for:P-IN:T-np\np/np the:S-the:P-DT:T-np/n friendly:S-friendly:P-JJ:T-n/n cooperation:S-cooperation:P-NN:T-n between:S-between:P-IN:T-np\np/np the:S-the:P-DT:T-np/n two:S-two:P-CD:T-n/n armies:S-army:P-NNS:T-n in:S-in:P-IN:T-np\np/np the:S-the:P-DT:T-np/n past:S-past:P-JJ:T-n/n 30:S-30:P-CD:T-n/n years:S-year:P-NNS:T-n .:S-.:P-.:T-sent\s[dcl] both parties expressed satisfaction for the friendly cooperation between the two armies in the past 30 years . 
w9:np/n:DT:the w8:np\np/np:IN:between w7:n:NN:cooperation w6:n/n:JJ:friendly w5:np/n:DT:the w4:np\np/np:IN:for w3:n:NN:satisfaction w2:s[dcl]\np/np:VBD:express w16:n:NNS:year w1:n:NNS:party w15:n/n:CD:30 w0:np/n:DT:both w14:n/n:JJ:past w13:np/n:DT:the w12:np\np/np:IN:in w11:n:NNS:army w10:n/n:CD:two both:S-both:P-DT:T-np/n parties:S-party:P-NNS:T-n expressed:S-express:P-VBD:T-s[dcl]\np/np satisfaction:S-satisfaction:P-NN:T-n for:S-for:P-IN:T-np\np/np the:S-the:P-DT:T-np/n friendly:S-friendly:P-JJ:T-n/n cooperation:S-cooperation:P-NN:T-n between:S-between:P-IN:T-np\np/np the:S-the:P-DT:T-np/n two:S-two:P-CD:T-n/n armies:S-army:P-NNS:T-n in:S-in:P-IN:T-np\np/np the:S-the:P-DT:T-np/n past:S-past:P-JJ:T-n/n 30:S-30:P-CD:T-n/n years:S-year:P-NNS:T-n .:S-.:P-.:T-sent\s[dcl] also present at the seminar will be long yongtu , vice minister of china 's ministry of foreign trade and economic cooperation who will accompany rugerro to shanghai , and shen jueren , former chief negotiator of china in gatt negotiations . attendees will also include the vice minister of foreign trade & economic cooperation , yongtu long , who accompanied ruggiero to shanghai , and former chief representative for trade negotiations of the moftec . xinhua news agency , nanjing , 16 december , by zhoufang the investment of foreign capital in agriculture of jiangsu increased . xinhua news agency , nanjing , dec. 16 . ( reporter zhou fang ) an increasing number of investments from foreign capital are being made on agriculture in jiangsu . france ministry of foreign affairs said that leaders of iraq refused to co-operate with united nations and have caused this deeply regretted outcome . w19:np/n:DT:this w9:n:NNS:iraq w18:s[pt]\np/np:VBN:cause w8:np\np/np:IN:of w17:s[dcl]\np/(s[pt]\np):VBP:PERF w7:n:NNS:leader w16:s[dcl]$\(s[dcl]$)/(s[dcl]$):CC:and w6:np/n:DT:that w15:n:NNS:nation w5:s[dcl]\np/s[dcl]:VBD:say w14:n/n:JJ:united w4:n:NNS:affair w13:pp/np:IN:with w3:n/n:JJ:foreign w12:s[b]\np/pp:VB:co-operate w2:np\np/np:IN:of w1:n:NN:ministry w10:s[dcl]\np/(s[to]\np):VBD:refuse w0:n/n:NN:france w22:n:NN:outcome w21:n/n:JJ:regretted w20:n/n/(n/n):RB:deeply france:S-france:P-NN:T-n/n ministry:S-ministry:P-NN:T-n of:S-of:P-IN:T-np\np/np foreign:S-foreign:P-JJ:T-n/n affairs:S-affair:P-NNS:T-n said:S-say:P-VBD:T-s[dcl]\np/s[dcl] that:S-that:P-DT:T-np/n leaders:S-leader:P-NNS:T-n of:S-of:P-IN:T-np\np/np iraq:S-iraq:P-NNS:T-n refused:S-refuse:P-VBD:T-s[dcl]\np/(s[to]\np) to:S-to:P-TO:T-s[to]\np/(s[b]\np) co-operate:S-co-operate:P-VB:T-s[b]\np/pp with:S-with:P-IN:T-pp/np united:S-united:P-JJ:T-n/n nations:S-nation:P-NNS:T-n and:S-and:P-CC:T-s[dcl]$\(s[dcl]$)/(s[dcl]$) have:S-have:P-VBP:T-s[dcl]\np/(s[pt]\np) caused:S-cause:P-VBN:T-s[pt]\np/np this:S-this:P-DT:T-np/n deeply:S-deeply:P-RB:T-n/n/(n/n) regretted:S-regretted:P-JJ:T-n/n outcome:S-outcome:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] the french foreign ministry said that because iraqi leader refuses to cooperate with the un caused this sad events . 
w9:s[dcl]\np/(s[to]\np):VBZ:refuse w8:n:NN:leader w7:n/n:JJ:iraqi w6:s/s/s[dcl]:IN:because w4:s[dcl]\np/s[em]:VBD:say w18:n:NNS:event w3:n:NN:ministry w17:n/n:JJ:sad w2:n/n:JJ:foreign w16:np/n:DT:this w1:n/n:JJ:french w15:s[dcl]\pp/np:VBD:cause w0:np/n:DT:the w14:n:NN:un w13:np/n:DT:the w12:pp/np:IN:with w11:s[b]\np:VB:cooperate the:S-the:P-DT:T-np/n french:S-french:P-JJ:T-n/n foreign:S-foreign:P-JJ:T-n/n ministry:S-ministry:P-NN:T-n said:S-say:P-VBD:T-s[dcl]\np/s[em] that:S-that:P-IN:T-s[em]/s[dcl] because:S-because:P-IN:T-s/s/s[dcl] iraqi:S-iraqi:P-JJ:T-n/n leader:S-leader:P-NN:T-n refuses:S-refuse:P-VBZ:T-s[dcl]\np/(s[to]\np) to:S-to:P-TO:T-s[to]\np/(s[b]\np) cooperate:S-cooperate:P-VB:T-s[b]\np with:S-with:P-IN:T-pp/np the:S-the:P-DT:T-np/n un:S-un:P-NN:T-n caused:S-cause:P-VBD:T-s[dcl]\pp/np this:S-this:P-DT:T-np/n sad:S-sad:P-JJ:T-n/n events:S-event:P-NNS:T-n .:S-.:P-.:T-sent\s[dcl] during the preliminaries , lan wei , a highly-skilled twenty-six year-old native of guangdong , scored 355.35 for first place . w9:n/n:JJ:twenty-six w8:n/n:JJ:highly-skilled w7:np/n:DT:a w5:n:NNS:wei w19:n:NN:place w4:n/n:JJ:lan w18:n/n:JJ:first w2:n:NNS:preliminaries w17:s\np\(s\np)/np:IN:for w16:s\np\(s\np):CD:355.35 w1:np/n:DT:the w15:s[dcl]\np:VBD:score w0:s/s/np:IN:during w13:n:NN:guangdong w12:np\np/np:IN:of w11:n:NN:native w10:n/n:JJ:year-old during:S-during:P-IN:T-s/s/np the:S-the:P-DT:T-np/n preliminaries:S-preliminaries:P-NNS:T-n ,:S-,:P-,:T-s/s\(s/s) lan:S-lan:P-JJ:T-n/n wei:S-wei:P-NNS:T-n ,:S-,:P-,:T-np\np/punct[,]/np a:S-a:P-DT:T-np/n highly-skilled:S-highly-skilled:P-JJ:T-n/n twenty-six:S-twenty-six:P-JJ:T-n/n year-old:S-year-old:P-JJ:T-n/n native:S-native:P-NN:T-n of:S-of:P-IN:T-np\np/np guangdong:S-guangdong:P-NN:T-n ,:S-,:P-,:T-punct[,] scored:S-score:P-VBD:T-s[dcl]\np 355.35:S-355.35:P-CD:T-s\np\(s\np) for:S-for:P-IN:T-s\np\(s\np)/np first:S-first:P-JJ:T-n/n place:S-place:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] in the qualifiers , 26-year-old lan wei from guangdong displayed excellent skill , and ranked no. 1 with a total score of 355.3 . w9:s[pss]\np:VBN:display w19:n/n:JJ:total w18:np/n:DT:a w8:s[ng]\np/(s[pss]\np):VBG:guangdong w17:s\np\(s\np)/np:IN:with w7:np\np/(s[ng]\np):IN:from w16:n[num]:CD:1 w6:n:NNS:wei w15:s\np\(s\np)/n[num]:NNP:no. 
w5:n/n:JJ:lan w14:s[pss]\np:VBD:rank w4:n/n:JJ:26-year-old w13:s[pss]$\(s[pss]$)\punct[,]/(s[pss]$):CC:and w3:np\np/np:,:, w2:n:NNS:qualifiers w11:s\np\(s\np):NN:skill w1:np/n:DT:the w10:s\np\(s\np)/(s\np\(s\np)):JJ:excellent w0:s/s/np:IN:in w22:n:CD:355.3 w21:np\np/np:IN:of w20:n:NN:score in:S-in:P-IN:T-s/s/np the:S-the:P-DT:T-np/n qualifiers:S-qualifiers:P-NNS:T-n ,:S-,:P-,:T-np\np/np 26-year-old:S-26-year-old:P-JJ:T-n/n lan:S-lan:P-JJ:T-n/n wei:S-wei:P-NNS:T-n from:S-from:P-IN:T-np\np/(s[ng]\np) guangdong:S-guangdong:P-VBG:T-s[ng]\np/(s[pss]\np) displayed:S-display:P-VBN:T-s[pss]\np excellent:S-excellent:P-JJ:T-s\np\(s\np)/(s\np\(s\np)) skill:S-skill:P-NN:T-s\np\(s\np) ,:S-,:P-,:T-punct[,] and:S-and:P-CC:T-s[pss]$\(s[pss]$)\punct[,]/(s[pss]$) ranked:S-rank:P-VBD:T-s[pss]\np no.:S-no.:P-NNP:T-s\np\(s\np)/n[num] 1:S-1:P-CD:T-n[num] with:S-with:P-IN:T-s\np\(s\np)/np a:S-a:P-DT:T-np/n total:S-total:P-JJ:T-n/n score:S-score:P-NN:T-n of:S-of:P-IN:T-np\np/np 355.3:S-355.3:P-CD:T-n .:S-.:P-.:T-sent\(s/s) nanjing , december 16 ( xinhua ) foreign fund put into jiangsu 's agricultural sector is increasing w9:s[pss]\np/pp:VBD:put w8:n:NN:fund w7:n/n:JJ:foreign w6:np/n:DT:rrb w5:np\np\(np\np)/np:IN:xinhua w4:np\np:NNS:lrb w3:np\np/(np\np):CD:16 w2:n:NN:december w16:s[ng]\np:VBG:increase w15:s[dcl]\np/(s[ng]\np):VBZ:PROG w0:s/s:NN:nanjing w14:n:NN:sector w13:n/n:JJ:agricultural w11:n:NNP:jiangsu w10:pp/np:IN:into nanjing:S-nanjing:P-NN:T-s/s ,:S-,:P-,:T-s/s\(s/s) december:S-december:P-NN:T-n 16:S-16:P-CD:T-np\np/(np\np) (:S-(:P-NNS:T-np\np xinhua:S-xinhua:P-IN:T-np\np\(np\np)/np ):S-):P-DT:T-np/n foreign:S-foreign:P-JJ:T-n/n fund:S-fund:P-NN:T-n put:S-put:P-VBD:T-s[pss]\np/pp into:S-into:P-IN:T-pp/np jiangsu:S-jiangsu:P-NNP:T-n 's:S-'s:P-POS:T-np/n\np agricultural:S-agricultural:P-JJ:T-n/n sector:S-sector:P-NN:T-n is:S-be:P-VBZ:T-s[dcl]\np/(s[ng]\np) increasing:S-increase:P-VBG:T-s[ng]\np xinhua news agency , nanjing , dec. 16 ( reporter zhou fang ) - foreign investment in jiangsu 's agriculture is on the rise . w19:s[dcl]\np/pp:VBZ:be w9:n/n:NN:reporter w18:n:NN:agriculture w8:n/n:NN:lrb w7:n/n:CD:16 w16:n:NNP:jiangsu w6:s[dcl]\np/np:VBZ:dec. w15:np\np/np:IN:in w14:n:NN:investment w4:n:NN:nanjing w13:n/n:JJ:foreign w12:n:SYM:rrb w2:n:NN:agency w11:n/n:VBG:fang w1:n/n:NN:news w10:n/n:NN:zhou w0:np/n:DT:xinhua w22:n:NN:rise w21:np/n:DT:the w20:pp/np:IN:on xinhua:S-xinhua:P-DT:T-np/n news:S-news:P-NN:T-n/n agency:S-agency:P-NN:T-n ,:S-,:P-,:T-np\np/punct[,]/np nanjing:S-nanjing:P-NN:T-n ,:S-,:P-,:T-punct[,] dec.:S-dec.:P-VBZ:T-s[dcl]\np/np 16:S-16:P-CD:T-n/n (:S-(:P-NN:T-n/n reporter:S-reporter:P-NN:T-n/n zhou:S-zhou:P-NN:T-n/n fang:S-fang:P-VBG:T-n/n ):S-):P-SYM:T-n -:S--:P--:T-punct[-] foreign:S-foreign:P-JJ:T-n/n investment:S-investment:P-NN:T-n in:S-in:P-IN:T-np\np/np jiangsu:S-jiangsu:P-NNP:T-n 's:S-'s:P-POS:T-np/n\np agriculture:S-agriculture:P-NN:T-n is:S-be:P-VBZ:T-s[dcl]\np/pp on:S-on:P-IN:T-pp/np the:S-the:P-DT:T-np/n rise:S-rise:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] someone connected global warming to the phenomenon of el nino . 
w9:n:NN:nino w8:n/n:JJ:el w7:np\np/np:IN:of w6:n:NN:phenomenon w5:np/n:DT:the w4:np\np/np:TO:to w3:n:NN:warming w2:n/n:JJ:global w1:n/n:JJ:connected w0:np/n:DT:someone someone:S-someone:P-DT:T-np/n connected:S-connected:P-JJ:T-n/n global:S-global:P-JJ:T-n/n warming:S-warming:P-NN:T-n to:S-to:P-TO:T-np\np/np the:S-the:P-DT:T-np/n phenomenon:S-phenomenon:P-NN:T-n of:S-of:P-IN:T-np\np/np el:S-el:P-JJ:T-n/n nino:S-nino:P-NN:T-n .:S-.:P-.:T-sent\np some linked global warming with el nino . w2:n/n:JJ:global w1:n/n:VBN:link w0:np/n:DT:some w6:n:NN:nino w5:n/n:JJ:el w4:np\np/np:IN:with w3:n:NN:warming some:S-some:P-DT:T-np/n linked:S-link:P-VBN:T-n/n global:S-global:P-JJ:T-n/n warming:S-warming:P-NN:T-n with:S-with:P-IN:T-np\np/np el:S-el:P-JJ:T-n/n nino:S-nino:P-NN:T-n .:S-.:P-.:T-sent\np xinhua news agency , beijing , january 16th , by xintang xu and yuhong qian- the president of the bank of china , xianglong dai said that , china will continue implementing the financial opening up policy . w34:n:NN:policy w33:np\np/np:IN:up w32:n:NN:opening w31:n/n:JJ:financial w30:np/n:DT:the w9:s[ng]\np/np:VBG:xintang w19:np\np/np:IN:of w18:n:NN:bank w8:s\np\(s\np)/(s[ng]\np):IN:by w17:np/n:DT:the w16:np\np/np:IN:of w6:s\np\(s\np):JJ:16th w15:n:NN:president w5:s\np\(s\np)/(s\np\(s\np)):JJ:january w4:s[ng]\np:VBG:beijing w14:np/n:DT:the w13:s\np\(s\np)/np:IN:qian- w12:n:NN:yuhong w2:n:NN:agency w11:n\n/n:CC:and w1:n/n:NN:news w10:n:NN:xu w0:np/n:DT:xinhua w29:s[ng]\np/np:VBG:implement w28:s[b]\np/(s[ng]\np):VB:continue w27:s[dcl]\np/(s[b]\np):MD:will w26:n:NN:china w24:s[dcl]\np/s[em]:VBD:say w23:s\np/(s\np):NN:dai w22:s\np/(s\np)/(s\np/(s\np)):JJ:xianglong w20:n:NN:china xinhua:S-xinhua:P-DT:T-np/n news:S-news:P-NN:T-n/n agency:S-agency:P-NN:T-n ,:S-,:P-,:T-s\np/(s\np)/punct[,]/(s\np) beijing:S-beijing:P-VBG:T-s[ng]\np ,:S-,:P-,:T-punct[,] january:S-january:P-JJ:T-s\np\(s\np)/(s\np\(s\np)) 16th:S-16th:P-JJ:T-s\np\(s\np) ,:S-,:P-,:T-s\np\(s\np)/(s\np\(s\np)) by:S-by:P-IN:T-s\np\(s\np)/(s[ng]\np) xintang:S-xintang:P-VBG:T-s[ng]\np/np xu:S-xu:P-NN:T-n and:S-and:P-CC:T-n\n/n yuhong:S-yuhong:P-NN:T-n qian-:S-qian-:P-IN:T-s\np\(s\np)/np the:S-the:P-DT:T-np/n president:S-president:P-NN:T-n of:S-of:P-IN:T-np\np/np the:S-the:P-DT:T-np/n bank:S-bank:P-NN:T-n of:S-of:P-IN:T-np\np/np china:S-china:P-NN:T-n ,:S-,:P-,:T-punct[,] xianglong:S-xianglong:P-JJ:T-s\np/(s\np)/(s\np/(s\np)) dai:S-dai:P-NN:T-s\np/(s\np) said:S-say:P-VBD:T-s[dcl]\np/s[em] that:S-that:P-IN:T-s[em]/s[dcl] ,:S-,:P-,:T-punct[,] china:S-china:P-NN:T-n will:S-will:P-MD:T-s[dcl]\np/(s[b]\np) continue:S-continue:P-VB:T-s[b]\np/(s[ng]\np) implementing:S-implement:P-VBG:T-s[ng]\np/np the:S-the:P-DT:T-np/n financial:S-financial:P-JJ:T-n/n opening:S-opening:P-NN:T-n up:S-up:P-IN:T-np\np/np policy:S-policy:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] xinhua news agency , beijing , january 16th ( reporter : xu xingtang , qian yuhong ) . dai xianglong , the president of people 's bank of china , said that china will carry on with the open financial policy . 
w37:n/n:JJ:open w36:np/n:DT:the w35:s\np\(s\np)/np:IN:with w34:s\np\(s\np):RP:on w33:s[b]\np:VB:carry w32:s[dcl]\np/(s[b]\np):MD:will w31:n:NN:china w9:n:NN:reporter w18:n:NNP:xianglong w8:n/n:NN:lrb w17:n/n:NNP:dai w7:n/n:JJ:16th w16:n:NN:rrb w6:n/n:JJ:january w15:n/n:JJ:yuhong w14:n/n:JJ:qian w4:s[ng]\np/np:VBG:beijing w13:np\np/np:,:, w2:n:NN:agency w12:n:NNP:xingtang w11:n/n:NNP:xu w1:n/n:NN:news w10:np\np/np:IN:| w0:np/n:DT:xinhua w29:s[dcl]\np/s[em]:VBD:say w27:n:NN:china w26:np\np/np:IN:of w25:n:NN:bank w23:n:NNS:people w22:np\np/np:IN:of w21:n:NN:president w20:np/n:DT:the w39:n:NN:policy w38:n/n:JJ:financial xinhua:S-xinhua:P-DT:T-np/n news:S-news:P-NN:T-n/n agency:S-agency:P-NN:T-n ,:S-,:P-,:T-s[dcl]\np/(s[dcl]\np) beijing:S-beijing:P-VBG:T-s[ng]\np/np ,:S-,:P-,:T-s\np\(s\np)/np january:S-january:P-JJ:T-n/n 16th:S-16th:P-JJ:T-n/n (:S-(:P-NN:T-n/n reporter:S-reporter:P-NN:T-n &#58;:S-&#58;:P-IN:T-np\np/np xu:S-xu:P-NNP:T-n/n xingtang:S-xingtang:P-NNP:T-n ,:S-,:P-,:T-np\np/np qian:S-qian:P-JJ:T-n/n yuhong:S-yuhong:P-JJ:T-n/n ):S-):P-NN:T-n .:S-.:P-.:T-punct[.] dai:S-dai:P-NNP:T-n/n xianglong:S-xianglong:P-NNP:T-n ,:S-,:P-,:T-np\np/punct[,]/np the:S-the:P-DT:T-np/n president:S-president:P-NN:T-n of:S-of:P-IN:T-np\np/np people:S-people:P-NNS:T-n 's:S-'s:P-POS:T-np/n\np bank:S-bank:P-NN:T-n of:S-of:P-IN:T-np\np/np china:S-china:P-NN:T-n ,:S-,:P-,:T-punct[,] said:S-say:P-VBD:T-s[dcl]\np/s[em] that:S-that:P-DT:T-s[em]/s[dcl] china:S-china:P-NN:T-n will:S-will:P-MD:T-s[dcl]\np/(s[b]\np) carry:S-carry:P-VB:T-s[b]\np on:S-on:P-RP:T-s\np\(s\np) with:S-with:P-IN:T-s\np\(s\np)/np the:S-the:P-DT:T-np/n open:S-open:P-JJ:T-n/n financial:S-financial:P-JJ:T-n/n policy:S-policy:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] this kind of measure restrained the economic growth , leading to the rise of unemployment . w9:s[ng]\np:VBG:lead w7:n:NN:growth w6:n/n:JJ:economic w5:np/n:DT:the w4:s[dcl]\np/np:VBD:restrain w3:n:NN:measure w2:np\np/np:IN:of w1:n:NN:kind w0:np/n:DT:this w14:n:NN:unemployment w13:np\np/np:IN:of w12:n:NN:rise w11:np/n:DT:the w10:s\np\(s\np)/np:TO:to this:S-this:P-DT:T-np/n kind:S-kind:P-NN:T-n of:S-of:P-IN:T-np\np/np measure:S-measure:P-NN:T-n restrained:S-restrain:P-VBD:T-s[dcl]\np/np the:S-the:P-DT:T-np/n economic:S-economic:P-JJ:T-n/n growth:S-growth:P-NN:T-n ,:S-,:P-,:T-s\np\(s\np)/(s\np) leading:S-lead:P-VBG:T-s[ng]\np to:S-to:P-TO:T-s\np\(s\np)/np the:S-the:P-DT:T-np/n rise:S-rise:P-NN:T-n of:S-of:P-IN:T-np\np/np unemployment:S-unemployment:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] such measures checked economic growth and caused unemployment to rise . w9:s[b]\np:VB:rise w7:n:NN:unemployment w6:s[dcl]\np/(s[to]\np)/np:VBD:cause w5:s[dcl]$\(s[dcl]$)/(s[dcl]$):CC:and w4:n:NN:growth w3:n/n:JJ:economic w2:s[dcl]\np/np:VBD:check w1:n:NNS:measure w0:np/np:JJ:such such:S-such:P-JJ:T-np/np measures:S-measure:P-NNS:T-n checked:S-check:P-VBD:T-s[dcl]\np/np economic:S-economic:P-JJ:T-n/n growth:S-growth:P-NN:T-n and:S-and:P-CC:T-s[dcl]$\(s[dcl]$)/(s[dcl]$) caused:S-cause:P-VBD:T-s[dcl]\np/(s[to]\np)/np unemployment:S-unemployment:P-NN:T-n to:S-to:P-TO:T-s[to]\np/(s[b]\np) rise:S-rise:P-VB:T-s[b]\np .:S-.:P-.:T-sent\s[dcl] siemens germany is currently cooperating with a local thai company , and constructing another 23km long electric railway project in bangkok . 
w19:s\np\(s\np)/np:IN:in w9:n:NN:company w18:n:NN:project w8:n/n:NN:thai w17:n/n:NN:railway w7:n/n:JJ:local w16:n/n:JJ:electric w6:np/n:DT:a w15:n/n:JJ:long w5:pp/np:IN:with w14:n/n:JJ:23km w4:s[ng]\np/pp:VBG:cooperate w13:np/n:DT:another w3:s\np\(s\np):RB:currently w12:s[ng]\np/np:VBG:construct w2:s[dcl]\np/(s[ng]\np):VBZ:PROG w11:s[ng]$\(s[ng]$)\punct[,]/(s[ng]$):CC:and w1:n:NN:germany w0:n/n:NNS:siemens w20:n:NN:bangkok siemens:S-siemens:P-NNS:T-n/n germany:S-germany:P-NN:T-n is:S-be:P-VBZ:T-s[dcl]\np/(s[ng]\np) currently:S-currently:P-RB:T-s\np\(s\np) cooperating:S-cooperate:P-VBG:T-s[ng]\np/pp with:S-with:P-IN:T-pp/np a:S-a:P-DT:T-np/n local:S-local:P-JJ:T-n/n thai:S-thai:P-NN:T-n/n company:S-company:P-NN:T-n ,:S-,:P-,:T-punct[,] and:S-and:P-CC:T-s[ng]$\(s[ng]$)\punct[,]/(s[ng]$) constructing:S-construct:P-VBG:T-s[ng]\np/np another:S-another:P-DT:T-np/n 23km:S-23km:P-JJ:T-n/n long:S-long:P-JJ:T-n/n electric:S-electric:P-JJ:T-n/n railway:S-railway:P-NN:T-n/n project:S-project:P-NN:T-n in:S-in:P-IN:T-s\np\(s\np)/np bangkok:S-bangkok:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] the german shermans company is currently working together with a local company constructing a 23 kilometer electronic train engineering project . w19:n:NN:project w9:np/n:DT:a w18:n/n:NN:engineering w8:s\np\(s\np)/np:IN:with w17:n/n:NN:train w7:s\np\(s\np):RB:together w6:s[ng]\np:VBG:work w16:n/n:JJ:electronic w15:n/n:NN:kilometer w5:s\np\(s\np):RB:currently w4:s[dcl]\np/(s[ng]\np):VBZ:PROG w14:n/n:CD:23 w13:np/n:DT:a w3:n:NN:company w12:s[ng]\np/np:VBG:construct w2:n/n:NNS:shermans w11:n:NN:company w1:n/n:NN:german w10:n/n:JJ:local w0:np/n:DT:the the:S-the:P-DT:T-np/n german:S-german:P-NN:T-n/n shermans:S-shermans:P-NNS:T-n/n company:S-company:P-NN:T-n is:S-be:P-VBZ:T-s[dcl]\np/(s[ng]\np) currently:S-currently:P-RB:T-s\np\(s\np) working:S-work:P-VBG:T-s[ng]\np together:S-together:P-RB:T-s\np\(s\np) with:S-with:P-IN:T-s\np\(s\np)/np a:S-a:P-DT:T-np/n local:S-local:P-JJ:T-n/n company:S-company:P-NN:T-n constructing:S-construct:P-VBG:T-s[ng]\np/np a:S-a:P-DT:T-np/n 23:S-23:P-CD:T-n/n kilometer:S-kilometer:P-NN:T-n/n electronic:S-electronic:P-JJ:T-n/n train:S-train:P-NN:T-n/n engineering:S-engineering:P-NN:T-n/n project:S-project:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] he said that the same resolve would lead to the success of the kyoto protocol . w9:np/n:DT:the w8:pp/np:TO:to w7:s[b]\np/pp:VB:lead w6:s[dcl]\np/(s[b]\np):MD:would w5:n:NN:resolve w4:n/n:JJ:same w3:np/n:DT:the w1:s[dcl]\np/s[em]:VBD:say w0:np:PRP:he w14:n:NN:protocol w13:n/n:NN:kyoto w12:np/n:DT:the w11:np\np/np:IN:of w10:n:NN:success he:S-he:P-PRP:T-np said:S-say:P-VBD:T-s[dcl]\np/s[em] that:S-that:P-IN:T-s[em]/s[dcl] the:S-the:P-DT:T-np/n same:S-same:P-JJ:T-n/n resolve:S-resolve:P-NN:T-n would:S-would:P-MD:T-s[dcl]\np/(s[b]\np) lead:S-lead:P-VB:T-s[b]\np/pp to:S-to:P-TO:T-pp/np the:S-the:P-DT:T-np/n success:S-success:P-NN:T-n of:S-of:P-IN:T-np\np/np the:S-the:P-DT:T-np/n kyoto:S-kyoto:P-NN:T-n/n protocol:S-protocol:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] he said that the same resolve would lead to the success of the kyoto protocol . 
w9:np/n:DT:the w8:pp/np:TO:to w7:s[b]\np/pp:VB:lead w6:s[dcl]\np/(s[b]\np):MD:would w5:n:NN:resolve w4:n/n:JJ:same w3:np/n:DT:the w1:s[dcl]\np/s[em]:VBD:say w0:np:PRP:he w14:n:NN:protocol w13:n/n:NN:kyoto w12:np/n:DT:the w11:np\np/np:IN:of w10:n:NN:success he:S-he:P-PRP:T-np said:S-say:P-VBD:T-s[dcl]\np/s[em] that:S-that:P-IN:T-s[em]/s[dcl] the:S-the:P-DT:T-np/n same:S-same:P-JJ:T-n/n resolve:S-resolve:P-NN:T-n would:S-would:P-MD:T-s[dcl]\np/(s[b]\np) lead:S-lead:P-VB:T-s[b]\np/pp to:S-to:P-TO:T-pp/np the:S-the:P-DT:T-np/n success:S-success:P-NN:T-n of:S-of:P-IN:T-np\np/np the:S-the:P-DT:T-np/n kyoto:S-kyoto:P-NN:T-n/n protocol:S-protocol:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] however , the official who disclosed the above declined to elaborate what kind of missile technology is being exported and when china provided such technology to pakistan and iran . w19:np\np\(np\np)/(np\np):CC:and w18:s[pss]\np:VBN:export w8:s[dcl]\np/(s[to]\np):VBD:decline w17:s[ng]\np/(s[pss]\np):VBG:PASS w7:n:NN:above w16:s[dcl]\np/(s[ng]\np):VBZ:PROG w6:np/n:DT:the w15:n:NN:technology w5:s[dcl]\np/np:VBD:disclose w14:n/n:NN:missile w13:np\np/np:IN:of w3:n:NN:official w12:n:NN:kind w2:np/n:DT:the w11:np/n:WP:what w10:s[b]\np:VB:elaborate w0:s/s:RB:however w28:s[b]\np:VB:iran w27:s[b]$\(s[b]$)/(s[b]$):CC:and w26:s[b]\np:VB:pakistan w24:n:NN:technology w23:np/np:JJ:such w22:s[dcl]\np/np:VBD:provide w21:n:NN:china w20:np\np/s[dcl]:WRB:when however:S-however:P-RB:T-s/s ,:S-,:P-,:T-s/s\(s/s) the:S-the:P-DT:T-np/n official:S-official:P-NN:T-n who:S-who:P-WP:T-np\np/(s[dcl]\np) disclosed:S-disclose:P-VBD:T-s[dcl]\np/np the:S-the:P-DT:T-np/n above:S-above:P-NN:T-n declined:S-decline:P-VBD:T-s[dcl]\np/(s[to]\np) to:S-to:P-TO:T-s[to]\np/(s[b]\np) elaborate:S-elaborate:P-VB:T-s[b]\np what:S-what:P-WP:T-np/n kind:S-kind:P-NN:T-n of:S-of:P-IN:T-np\np/np missile:S-missile:P-NN:T-n/n technology:S-technology:P-NN:T-n is:S-be:P-VBZ:T-s[dcl]\np/(s[ng]\np) being:S-be:P-VBG:T-s[ng]\np/(s[pss]\np) exported:S-export:P-VBN:T-s[pss]\np and:S-and:P-CC:T-np\np\(np\np)/(np\np) when:S-when:P-WRB:T-np\np/s[dcl] china:S-china:P-NN:T-n provided:S-provide:P-VBD:T-s[dcl]\np/np such:S-such:P-JJ:T-np/np technology:S-technology:P-NN:T-n to:S-to:P-TO:T-s[to]\np/(s[b]\np) pakistan:S-pakistan:P-VB:T-s[b]\np and:S-and:P-CC:T-s[b]$\(s[b]$)/(s[b]$) iran:S-iran:P-VB:T-s[b]\np .:S-.:P-.:T-sent\(np\np) however , the official was not willing to explain what kind of missile technology that china provided to pakistan and iran , and when this technology was provided . 
w19:n:NN:iran w9:n:NN:kind w18:n\n/n:CC:and w8:np/n:WP:what w17:n:NN:pakistan w7:s[b]\np/np:VB:explain w16:pp/np:TO:to w15:s[pss]\np/pp:VBN:provide w5:s[adj]\np/(s[to]\np):JJ:willing w14:s[dcl]\np/(s[pss]\np):VBZ:china w4:s\np\(s\np):RB:not w3:s[dcl]\np/(s[adj]\np):VBD:be w12:n:NN:technology w2:n:NN:official w11:n/n:NN:missile w1:np/n:DT:the w10:np\np/np:IN:of w0:s/s:RB:however w26:s[pss]\np:VBN:provide w25:s[dcl]\np/(s[pss]\np):VBD:PASS w24:n:NN:technology w23:np/n:DT:this w22:s/s/s[dcl]:WRB:when w21:s$\(s$)/(s$):CC:and however:S-however:P-RB:T-s/s ,:S-,:P-,:T-punct[,] the:S-the:P-DT:T-np/n official:S-official:P-NN:T-n was:S-be:P-VBD:T-s[dcl]\np/(s[adj]\np) not:S-not:P-RB:T-s\np\(s\np) willing:S-willing:P-JJ:T-s[adj]\np/(s[to]\np) to:S-to:P-TO:T-s[to]\np/(s[b]\np) explain:S-explain:P-VB:T-s[b]\np/np what:S-what:P-WP:T-np/n kind:S-kind:P-NN:T-n of:S-of:P-IN:T-np\np/np missile:S-missile:P-NN:T-n/n technology:S-technology:P-NN:T-n that:S-that:P-WDT:T-np\np/(s[dcl]\np) china:S-china:P-VBZ:T-s[dcl]\np/(s[pss]\np) provided:S-provide:P-VBN:T-s[pss]\np/pp to:S-to:P-TO:T-pp/np pakistan:S-pakistan:P-NN:T-n and:S-and:P-CC:T-n\n/n iran:S-iran:P-NN:T-n ,:S-,:P-,:T-s/s\np and:S-and:P-CC:T-s$\(s$)/(s$) when:S-when:P-WRB:T-s/s/s[dcl] this:S-this:P-DT:T-np/n technology:S-technology:P-NN:T-n was:S-be:P-VBD:T-s[dcl]\np/(s[pss]\np) provided:S-provide:P-VBN:T-s[pss]\np .:S-.:P-.:T-sent\(s/s) yunnan gardens was developed by fujian company , there are 313 apartments in this residential project . w9:n/n:CD:313 w8:s[dcl]\np[thr]/np:VBP:be w6:n:NN:company w5:n/n:JJ:fujian w4:s\np\(s\np)/np:IN:by w3:s[pss]\np:VBN:develop w2:s[dcl]\np/(s[pss]\np):VBD:PASS w1:n:NNS:garden w0:n/n:JJ:yunnan w14:n:NN:project w13:n/n:JJ:residential w12:np/n:DT:this w11:np\np/np:IN:in w10:n:NNS:apartment yunnan:S-yunnan:P-JJ:T-n/n gardens:S-garden:P-NNS:T-n was:S-be:P-VBD:T-s[dcl]\np/(s[pss]\np) developed:S-develop:P-VBN:T-s[pss]\np by:S-by:P-IN:T-s\np\(s\np)/np fujian:S-fujian:P-JJ:T-n/n company:S-company:P-NN:T-n ,:S-,:P-,:T-punct[,] there:S-there:P-EX:T-np[thr] are:S-be:P-VBP:T-s[dcl]\np[thr]/np 313:S-313:P-CD:T-n/n apartments:S-apartment:P-NNS:T-n in:S-in:P-IN:T-np\np/np this:S-this:P-DT:T-np/n residential:S-residential:P-JJ:T-n/n project:S-project:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] the yunnan gardens project developed by the fujian society is a 313-unit housing project with land . w9:s[dcl]\np/np:VBZ:be w8:n:NN:society w7:n/n:JJ:fujian w6:np/n:DT:the w5:s\np\(s\np)/np:IN:by w4:s[pss]\np:VBN:develop w3:n:NN:project w2:n/n:NNS:garden w1:n/n:JJ:yunnan w15:n:NN:land w0:np/n:DT:the w14:np\np/np:IN:with w13:n:NN:project w12:n/n:NN:housing w11:n/n:JJ:313-unit w10:np/n:DT:a the:S-the:P-DT:T-np/n yunnan:S-yunnan:P-JJ:T-n/n gardens:S-garden:P-NNS:T-n/n project:S-project:P-NN:T-n developed:S-develop:P-VBN:T-s[pss]\np by:S-by:P-IN:T-s\np\(s\np)/np the:S-the:P-DT:T-np/n fujian:S-fujian:P-JJ:T-n/n society:S-society:P-NN:T-n is:S-be:P-VBZ:T-s[dcl]\np/np a:S-a:P-DT:T-np/n 313-unit:S-313-unit:P-JJ:T-n/n housing:S-housing:P-NN:T-n/n project:S-project:P-NN:T-n with:S-with:P-IN:T-np\np/np land:S-land:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] in the last two years , some foreign businessmen showed their interest in the construction of xiling city . 
w9:s[dcl]\np/np:VBD:show w8:n:NNS:businessman w7:n/n:JJ:foreign w6:np/n:DT:some w4:n:NNS:year w3:n/n:CD:two w17:n:NN:city w2:n/n:JJ:last w16:s[ng]\np/np:VBG:xiling w1:np/n:DT:the w15:np\np/(s[ng]\np):IN:of w0:s/s/np:IN:in w14:n:NN:construction w13:np/n:DT:the w12:np\np/np:IN:in w11:n:NN:interest w10:np/n:PRP$:their in:S-in:P-IN:T-s/s/np the:S-the:P-DT:T-np/n last:S-last:P-JJ:T-n/n two:S-two:P-CD:T-n/n years:S-year:P-NNS:T-n ,:S-,:P-,:T-s/s\(s/s) some:S-some:P-DT:T-np/n foreign:S-foreign:P-JJ:T-n/n businessmen:S-businessman:P-NNS:T-n showed:S-show:P-VBD:T-s[dcl]\np/np their:S-their:P-PRP$:T-np/n interest:S-interest:P-NN:T-n in:S-in:P-IN:T-np\np/np the:S-the:P-DT:T-np/n construction:S-construction:P-NN:T-n of:S-of:P-IN:T-np\np/(s[ng]\np) xiling:S-xiling:P-VBG:T-s[ng]\np/np city:S-city:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] during the past two years , a batch of foreign businessmen expressed their wishes to get involved in xining 's city construction one after another . w9:n/n:JJ:foreign w18:n:NN:xining w8:np\np/np:IN:of w17:pp/np:IN:in w7:n:NN:batch w16:s[adj]\np/pp:VBN:involve w6:np/n:DT:a w15:s[b]\np/(s[adj]\np):VB:get w4:n:NNS:year w13:n:NNS:wish w3:n/n:CD:two w12:np/n:PRP$:their w2:n/n:JJ:past w11:s[dcl]\np/np:VBD:express w1:np/n:DT:the w10:n:NNS:businessman w0:s/s/np:IN:during w24:np:DT:another w23:np\np/np:IN:after w22:n:NN:one w21:n/n:NN:construction w20:n/n:NN:city during:S-during:P-IN:T-s/s/np the:S-the:P-DT:T-np/n past:S-past:P-JJ:T-n/n two:S-two:P-CD:T-n/n years:S-year:P-NNS:T-n ,:S-,:P-,:T-s/s\(s/s) a:S-a:P-DT:T-np/n batch:S-batch:P-NN:T-n of:S-of:P-IN:T-np\np/np foreign:S-foreign:P-JJ:T-n/n businessmen:S-businessman:P-NNS:T-n expressed:S-express:P-VBD:T-s[dcl]\np/np their:S-their:P-PRP$:T-np/n wishes:S-wish:P-NNS:T-n to:S-to:P-TO:T-s[to]\np/(s[b]\np) get:S-get:P-VB:T-s[b]\np/(s[adj]\np) involved:S-involve:P-VBN:T-s[adj]\np/pp in:S-in:P-IN:T-pp/np xining:S-xining:P-NN:T-n 's:S-'s:P-POS:T-np/n\np city:S-city:P-NN:T-n/n construction:S-construction:P-NN:T-n/n one:S-one:P-NN:T-n after:S-after:P-IN:T-np\np/np another:S-another:P-DT:T-np .:S-.:P-.:T-sent\s[dcl] the dai yu xiang industrial consulting company said that spacious front door area is the biggest characteristic of yunnan gardens with land ownership . w19:n:NNS:garden w9:n/n:JJ:spacious w18:n/n:JJ:yunnan w7:s[dcl]\np/s[em]:VBD:say w17:np\np/np:IN:of w16:n:NN:characteristic w6:n:NN:company w15:n/n:JJS:biggest w5:n/n:NN:consulting w14:np/n:DT:the w4:n/n:JJ:industrial w13:s[dcl]\np/np:VBZ:be w3:n/n:VBG:xiang w12:n:NN:area w2:n/n:NN:yu w11:n/n:NN:door w1:n/n:JJ:dai w10:n/n:JJ:front w0:np/n:DT:the w22:n:NN:ownership w21:n/n:NN:land w20:np\np/np:IN:with the:S-the:P-DT:T-np/n dai:S-dai:P-JJ:T-n/n yu:S-yu:P-NN:T-n/n xiang:S-xiang:P-VBG:T-n/n industrial:S-industrial:P-JJ:T-n/n consulting:S-consulting:P-NN:T-n/n company:S-company:P-NN:T-n said:S-say:P-VBD:T-s[dcl]\np/s[em] that:S-that:P-IN:T-s[em]/s[dcl] spacious:S-spacious:P-JJ:T-n/n front:S-front:P-JJ:T-n/n door:S-door:P-NN:T-n/n area:S-area:P-NN:T-n is:S-be:P-VBZ:T-s[dcl]\np/np the:S-the:P-DT:T-np/n biggest:S-biggest:P-JJS:T-n/n characteristic:S-characteristic:P-NN:T-n of:S-of:P-IN:T-np\np/np yunnan:S-yunnan:P-JJ:T-n/n gardens:S-garden:P-NNS:T-n with:S-with:P-IN:T-np\np/np land:S-land:P-NN:T-n/n ownership:S-ownership:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] dai yuxiang real estate consulting firm said that the most special characteristic of the landed residences at yunnan gardens is their spacious appearance . 
w19:s[dcl]\np/np:VBZ:be w9:n/n/(n/n):RBS:most w18:n:NNS:garden w8:np/n:DT:the w17:n/n:JJ:yunnan w6:s[dcl]\np/s[em]:VBD:say w16:np\np/np:IN:at w15:n:NNS:residence w5:n:NN:firm w14:n/n:VBN:land w4:n/n:NN:consulting w13:np/n:DT:the w3:n/n:NN:estate w12:np\np/np:IN:of w2:n/n:JJ:real w11:n:NN:characteristic w1:n/n:NNP:yuxiang w10:n/n:JJ:special w0:n/n:NNP:dai w22:n:NN:appearance w21:n/n:JJ:spacious w20:np/n:PRP$:their dai:S-dai:P-NNP:T-n/n yuxiang:S-yuxiang:P-NNP:T-n/n real:S-real:P-JJ:T-n/n estate:S-estate:P-NN:T-n/n consulting:S-consulting:P-NN:T-n/n firm:S-firm:P-NN:T-n said:S-say:P-VBD:T-s[dcl]\np/s[em] that:S-that:P-IN:T-s[em]/s[dcl] the:S-the:P-DT:T-np/n most:S-most:P-RBS:T-n/n/(n/n) special:S-special:P-JJ:T-n/n characteristic:S-characteristic:P-NN:T-n of:S-of:P-IN:T-np\np/np the:S-the:P-DT:T-np/n landed:S-land:P-VBN:T-n/n residences:S-residence:P-NNS:T-n at:S-at:P-IN:T-np\np/np yunnan:S-yunnan:P-JJ:T-n/n gardens:S-garden:P-NNS:T-n is:S-be:P-VBZ:T-s[dcl]\np/np their:S-their:P-PRP$:T-np/n spacious:S-spacious:P-JJ:T-n/n appearance:S-appearance:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] this measure restrained economic growth and raised the rate of unemployment . w9:np\np/np:IN:of w8:n:NN:rate w7:np/n:DT:the w6:s[dcl]\np/np:VBD:raise w5:s[dcl]$\(s[dcl]$)/(s[dcl]$):CC:and w4:n:NN:growth w3:n/n:JJ:economic w2:s[dcl]\np/np:VBD:restrain w1:n:NN:measure w0:np/n:DT:this w10:n:NN:unemployment this:S-this:P-DT:T-np/n measure:S-measure:P-NN:T-n restrained:S-restrain:P-VBD:T-s[dcl]\np/np economic:S-economic:P-JJ:T-n/n growth:S-growth:P-NN:T-n and:S-and:P-CC:T-s[dcl]$\(s[dcl]$)/(s[dcl]$) raised:S-raise:P-VBD:T-s[dcl]\np/np the:S-the:P-DT:T-np/n rate:S-rate:P-NN:T-n of:S-of:P-IN:T-np\np/np unemployment:S-unemployment:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] this curbs economic growth and increases unemployment rates . according to xinhua news agency , london , on february 3rd , bbc reporter bowen stayed in baghdad . the capital of iraq stated that there was no evidence to indicate the bomb-shelter destroyed by a us bomber was a military target . w36:s[dcl]\np/np:VBD:be w35:s\np/(s\np):NN:bomber w34:np:PRP:us w33:np:DT:a w32:s\np\(s\np)/np:IN:by w31:s[pss]\np:VBN:destroy w30:n:NN:bomb-shelter w29:np/n:DT:the w28:s[b]\np/np:VB:indicate w26:n:NN:evidence w25:np/n:DT:no w24:s[dcl]\np[thr]/np:VBD:be w21:s[dcl]\np/s[em]:VBD:state w20:n:NNP:iraq h1:n\(n/n)/n:,:has-rel w9:n/n:JJ:3rd w8:n/n:JJ:february w7:s\np/(s\np)/np:IN:on w5:n:NN:london w4:n:NN:agency w3:n/n:NN:news w19:np\np/np:IN:of w2:n/n:NNP:xinhua w18:n:NN:capital w1:pp/np:TO:to w17:np/n:DT:the w0:s/s/pp:VBG:accord w16:n:NN:baghdad w15:pp/np:IN:in w14:s[dcl]\np/pp:VBD:stay w13:n:NN:bowen w12:n/n:NN:reporter w11:n/n:JJ:bbc w10:n\(n/n)/n:,:, w39:n:NN:target w38:n/n:JJ:military w37:np/n:DT:a according:S-accord:P-VBG:T-s/s/pp to:S-to:P-TO:T-pp/np xinhua:S-xinhua:P-NNP:T-n/n news:S-news:P-NN:T-n/n agency:S-agency:P-NN:T-n ,:S-,:P-,:T-punct[,] london:S-london:P-NN:T-n ,:S-,:P-,:T-s[dcl]\np/(s[dcl]\np) on:S-on:P-IN:T-s\np/(s\np)/np february:S-february:P-JJ:T-n/n 3rd:S-3rd:P-JJ:T-n/n ,:S-,:P-,:T-n\(n/n)/n bbc:S-bbc:P-JJ:T-n/n reporter:S-reporter:P-NN:T-n/n bowen:S-bowen:P-NN:T-n stayed:S-stay:P-VBD:T-s[dcl]\np/pp in:S-in:P-IN:T-pp/np baghdad:S-baghdad:P-NN:T-n .:S-.:P-.:T-punct[.] 
the:S-the:P-DT:T-np/n capital:S-capital:P-NN:T-n of:S-of:P-IN:T-np\np/np iraq:S-iraq:P-NNP:T-n stated:S-state:P-VBD:T-s[dcl]\np/s[em] that:S-that:P-IN:T-s[em]/s[dcl] there:S-there:P-EX:T-np[thr] was:S-be:P-VBD:T-s[dcl]\np[thr]/np no:S-no:P-DT:T-np/n evidence:S-evidence:P-NN:T-n to:S-to:P-TO:T-s[to]\np/(s[b]\np) indicate:S-indicate:P-VB:T-s[b]\np/np the:S-the:P-DT:T-np/n bomb-shelter:S-bomb-shelter:P-NN:T-n destroyed:S-destroy:P-VBN:T-s[pss]\np by:S-by:P-IN:T-s\np\(s\np)/np a:S-a:P-DT:T-np us:S-us:P-PRP:T-np bomber:S-bomber:P-NN:T-s\np/(s\np) was:S-be:P-VBD:T-s[dcl]\np/np a:S-a:P-DT:T-np/n military:S-military:P-JJ:T-n/n target:S-target:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] according to xinhua news report from london on february 13 , bonne , a reporter of bbc in iraqi capital baghdad , confirmed on 13th that no any sign showed the bomb shelter in baghdad destroyed by american bomber was a military blindage . w36:s\np\(s\np)/np:IN:by w35:s[pss]\np:VBN:destroy w34:n:NN:baghdad w33:np\np/np:IN:in w32:n:NN:shelter w31:n/n:NN:bomb w30:np/n:DT:the w29:s[dcl]\np/s[dcl]:VBD:show w28:n:NN:sign w27:n/n:DT:any w26:np/n:DT:no w24:n:NN:13th w23:s\np\(s\np)/np:IN:on w22:s[dcl]\np/np:VBD:confirm w20:n:NN:baghdad w9:n:CD:13 w8:n/n:JJ:february w7:np\np/np:IN:on w6:n:NN:london w5:np\np/np:IN:from w4:n:NN:report w3:n/n:NN:news w19:n/n:NN:capital w2:np/n:DT:xinhua w18:n/n:JJ:iraqi w1:pp/np:TO:to w17:np\np/np:IN:in w0:s/s/pp:VBG:accord w16:n:NN:bbc w15:np\np/np:IN:of w14:n:NN:reporter w13:np/n:DT:a w11:n:NN:bonne w42:n:NN:blindage w41:n/n:JJ:military w40:np/n:DT:a w39:s[dcl]\np/np:VBD:be w38:n:NN:bomber w37:n/n:JJ:american according:S-accord:P-VBG:T-s/s/pp to:S-to:P-TO:T-pp/np xinhua:S-xinhua:P-DT:T-np/n news:S-news:P-NN:T-n/n report:S-report:P-NN:T-n from:S-from:P-IN:T-np\np/np london:S-london:P-NN:T-n on:S-on:P-IN:T-np\np/np february:S-february:P-JJ:T-n/n 13:S-13:P-CD:T-n ,:S-,:P-,:T-np\np/punct[,]/np bonne:S-bonne:P-NN:T-n ,:S-,:P-,:T-punct[,] a:S-a:P-DT:T-np/n reporter:S-reporter:P-NN:T-n of:S-of:P-IN:T-np\np/np bbc:S-bbc:P-NN:T-n in:S-in:P-IN:T-np\np/np iraqi:S-iraqi:P-JJ:T-n/n capital:S-capital:P-NN:T-n/n baghdad:S-baghdad:P-NN:T-n ,:S-,:P-,:T-s[dcl]\np/(s[dcl]\np) confirmed:S-confirm:P-VBD:T-s[dcl]\np/np on:S-on:P-IN:T-s\np\(s\np)/np 13th:S-13th:P-NN:T-n that:S-that:P-IN:T-np\np/(s[dcl]/np) no:S-no:P-DT:T-np/n any:S-any:P-DT:T-n/n sign:S-sign:P-NN:T-n showed:S-show:P-VBD:T-s[dcl]\np/s[dcl] the:S-the:P-DT:T-np/n bomb:S-bomb:P-NN:T-n/n shelter:S-shelter:P-NN:T-n in:S-in:P-IN:T-np\np/np baghdad:S-baghdad:P-NN:T-n destroyed:S-destroy:P-VBN:T-s[pss]\np by:S-by:P-IN:T-s\np\(s\np)/np american:S-american:P-JJ:T-n/n bomber:S-bomber:P-NN:T-n was:S-be:P-VBD:T-s[dcl]\np/np a:S-a:P-DT:T-np/n military:S-military:P-JJ:T-n/n blindage:S-blindage:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] mr. siazon said , someone used to say , have n't we been burned once before ? when we were ready to accept them , it did n't take long before they fought agaion . w32:s\np\(s\np):NN:agaion w31:s[dcl]\np:VBD:fight w30:np:PRP:they w19:s[adj]\np/(s[to]\np):JJ:ready w9:s[dcl]\np/np:VBP:have w18:s[dcl]\np/(s[adj]\np):VBD:be w17:np:PRP:we w7:s[b]\np:VB:say w16:s/s/s[dcl]:WRB:when w15:s\np\(s\np):RB:before w5:s[pss]\np/(s[to]\np):VBD:use w14:s\np\(s\np)/(s\np\(s\np)):RB:once w4:np:DT:someone w13:s[pss]\np:VBN:burn w12:s[dcl]\np/(s[pss]\np):VBD:been w2:s[dcl]\np/s[dcl]/punct[,]:VBD:say w11:np:PRP:we w1:n:NN:siazon w10:s\np\(s\np):RB:n't w0:np/n:DT:mr. 
w29:s\np\(s\np)/s[dcl]:IN:before w28:s\np\(s\np):RB:long w27:s[b]\np:VB:take w26:s\np\(s\np):RB:n't w25:s[dcl]\np/(s[b]\np):VBD:do w24:np:PRP:it w22:np:PRP:them w21:s[b]\np/np:VB:accept mr.:S-mr.:P-DT:T-np/n siazon:S-siazon:P-NN:T-n said:S-say:P-VBD:T-s[dcl]\np/s[dcl]/punct[,] ,:S-,:P-,:T-punct[,] someone:S-someone:P-DT:T-np used:S-use:P-VBD:T-s[pss]\np/(s[to]\np) to:S-to:P-TO:T-s[to]\np/(s[b]\np) say:S-say:P-VB:T-s[b]\np ,:S-,:P-,:T-s[pss]\np\(s[pss]\np) have:S-have:P-VBP:T-s[dcl]\np/np n't:S-n't:P-RB:T-s\np\(s\np) we:S-we:P-PRP:T-np been:S-been:P-VBD:T-s[dcl]\np/(s[pss]\np) burned:S-burn:P-VBN:T-s[pss]\np once:S-once:P-RB:T-s\np\(s\np)/(s\np\(s\np)) before:S-before:P-RB:T-s\np\(s\np) ?:S-?:P-?:T-punct[?] when:S-when:P-WRB:T-s/s/s[dcl] we:S-we:P-PRP:T-np were:S-be:P-VBD:T-s[dcl]\np/(s[adj]\np) ready:S-ready:P-JJ:T-s[adj]\np/(s[to]\np) to:S-to:P-TO:T-s[to]\np/(s[b]\np) accept:S-accept:P-VB:T-s[b]\np/np them:S-them:P-PRP:T-np ,:S-,:P-,:T-s/s\(s/s) it:S-it:P-PRP:T-np did:S-do:P-VBD:T-s[dcl]\np/(s[b]\np) n't:S-n't:P-RB:T-s\np\(s\np) take:S-take:P-VB:T-s[b]\np long:S-long:P-RB:T-s\np\(s\np) before:S-before:P-IN:T-s\np\(s\np)/s[dcl] they:S-they:P-PRP:T-np fought:S-fight:P-VBD:T-s[dcl]\np agaion:S-agaion:P-NN:T-s\np\(s\np) .:S-.:P-.:T-sent\s[dcl] siazon said : someone says , were we deceived before ? when we prepared to accept them but just after several days they began to fight again . w19:n/n:JJ:several w9:s\np\(s\np):IN:before w18:s/s/np:IN:after w8:s[dcl]\np:VBD:deceive w17:s/s/(s/s):RB:just w7:np:PRP:we w16:s$\(s$)/(s$):CC:but w6:s[dcl]\np/np:VBD:be w15:np:PRP:them w5:s[dcl]$\(s[dcl]$)/(s[dcl]$):,:, w14:s[b]\np/np:VB:accept w4:s[dcl]\np:VBZ:say w3:np:DT:someone w12:s[dcl]\np/(s[to]\np):VBD:prepare w2:s\s/s[dcl]:IN:| w11:np:PRP:we w1:s[dcl]\np/s[dcl]:VBD:say w10:s/s/s[dcl]:WRB:when w0:n:NN:siazon w25:s\np\(s\np):RB:again w24:s[b]\np:VB:fight w22:s[dcl]\np/(s[to]\np):VBD:begin w21:np:PRP:they w20:n:NNS:day siazon:S-siazon:P-NN:T-n said:S-say:P-VBD:T-s[dcl]\np/s[dcl] &#58;:S-&#58;:P-IN:T-s\s/s[dcl] someone:S-someone:P-DT:T-np says:S-say:P-VBZ:T-s[dcl]\np ,:S-,:P-,:T-s[dcl]$\(s[dcl]$)/(s[dcl]$) were:S-be:P-VBD:T-s[dcl]\np/np we:S-we:P-PRP:T-np deceived:S-deceive:P-VBD:T-s[dcl]\np before:S-before:P-IN:T-s\np\(s\np) ?:S-?:P-?:T-punct[?] when:S-when:P-WRB:T-s/s/s[dcl] we:S-we:P-PRP:T-np prepared:S-prepare:P-VBD:T-s[dcl]\np/(s[to]\np) to:S-to:P-TO:T-s[to]\np/(s[b]\np) accept:S-accept:P-VB:T-s[b]\np/np them:S-them:P-PRP:T-np but:S-but:P-CC:T-s$\(s$)/(s$) just:S-just:P-RB:T-s/s/(s/s) after:S-after:P-IN:T-s/s/np several:S-several:P-JJ:T-n/n days:S-day:P-NNS:T-n they:S-they:P-PRP:T-np began:S-begin:P-VBD:T-s[dcl]\np/(s[to]\np) to:S-to:P-TO:T-s[to]\np/(s[b]\np) fight:S-fight:P-VB:T-s[b]\np again:S-again:P-RB:T-s\np\(s\np) .:S-.:P-.:T-sent\s[dcl] railroad officials blamed the bus passengers for the accident , the indian news agency india press trust report said . 
w18:s[dcl]\s[dcl]\np:VBD:say w8:n:NN:accident w17:n:NN:report w7:np/n:DT:the w16:n/n:NN:trust w6:pp/np:IN:for w15:n/n:NN:press w5:n:NNS:passenger w14:n/n:NN:india w4:n/n:NN:bus w13:n/n:NN:agency w3:np/n:DT:the w12:n/n:NN:news w2:s[dcl]\np/pp/np:VBD:blame w11:n/n:JJ:indian w1:n:NNS:official w10:np/n:DT:the w0:n/n:NN:railroad railroad:S-railroad:P-NN:T-n/n officials:S-official:P-NNS:T-n blamed:S-blame:P-VBD:T-s[dcl]\np/pp/np the:S-the:P-DT:T-np/n bus:S-bus:P-NN:T-n/n passengers:S-passenger:P-NNS:T-n for:S-for:P-IN:T-pp/np the:S-the:P-DT:T-np/n accident:S-accident:P-NN:T-n ,:S-,:P-,:T-s\s/(s\s) the:S-the:P-DT:T-np/n indian:S-indian:P-JJ:T-n/n news:S-news:P-NN:T-n/n agency:S-agency:P-NN:T-n/n india:S-india:P-NN:T-n/n press:S-press:P-NN:T-n/n trust:S-trust:P-NN:T-n/n report:S-report:P-NN:T-n said:S-say:P-VBD:T-s[dcl]\s[dcl]\np .:S-.:P-.:T-sent\s[dcl] report of pti said that railway official charged the bus passengers upon the accident . w9:n/n:NN:bus w8:np/n:DT:the w7:s[dcl]\np/pp/np:VBD:charge w6:n:NN:official w5:n/n:NN:railway w3:s[dcl]\np/s[em]:VBD:say w2:n:NNS:pti w1:np\np/np:IN:of w0:n:NN:report w13:n:NN:accident w12:np/n:DT:the w11:pp/np:IN:upon w10:n:NNS:passenger report:S-report:P-NN:T-n of:S-of:P-IN:T-np\np/np pti:S-pti:P-NNS:T-n said:S-say:P-VBD:T-s[dcl]\np/s[em] that:S-that:P-DT:T-s[em]/s[dcl] railway:S-railway:P-NN:T-n/n official:S-official:P-NN:T-n charged:S-charge:P-VBD:T-s[dcl]\np/pp/np the:S-the:P-DT:T-np/n bus:S-bus:P-NN:T-n/n passengers:S-passenger:P-NNS:T-n upon:S-upon:P-IN:T-pp/np the:S-the:P-DT:T-np/n accident:S-accident:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] we mentioned the problems australia is concerned with , such as human rights and dispatching army officers to east timor . w9:np\np/np:IN:as w18:n:NN:timor w8:np\np/(np\np):JJ:such w7:pp/np:IN:with w17:n/n:JJ:east w16:np\np/np:TO:to w6:s[pss]\np/pp:VBN:concern w15:n:NNS:officer w5:s[dcl]\np/(s[pss]\np):VBZ:PASS w14:n/n:NN:army w4:n:NN:australia w13:n/n:VBG:dispatch w3:n/n:NNS:problem w12:np\np/np:CC:and w2:np/n:DT:the w11:n:NNS:rights w1:s[dcl]\np/np:VBD:mention w10:n/n:JJ:human w0:np:PRP:we we:S-we:P-PRP:T-np mentioned:S-mention:P-VBD:T-s[dcl]\np/np the:S-the:P-DT:T-np/n problems:S-problem:P-NNS:T-n/n australia:S-australia:P-NN:T-n is:S-be:P-VBZ:T-s[dcl]\np/(s[pss]\np) concerned:S-concern:P-VBN:T-s[pss]\np/pp with:S-with:P-IN:T-pp/np ,:S-,:P-,:T-punct[,] such:S-such:P-JJ:T-np\np/(np\np) as:S-as:P-IN:T-np\np/np human:S-human:P-JJ:T-n/n rights:S-rights:P-NNS:T-n and:S-and:P-CC:T-np\np/np dispatching:S-dispatch:P-VBG:T-n/n army:S-army:P-NN:T-n/n officers:S-officer:P-NNS:T-n to:S-to:P-TO:T-np\np/np east:S-east:P-JJ:T-n/n timor:S-timor:P-NN:T-n .:S-.:P-.:T-sent\(np\np) we mentioned the problems that have attracted australia 's attention , such as the humam rights in east timor and the issue of sending military officers to east timor . 
w19:np\np/np:CC:and w9:n:NN:attention w18:n:NN:timor w17:n/n:JJ:east w7:n:NN:australia w6:s[pt]\np/np:VBN:attract w16:np\np/np:IN:in w15:n:NNS:rights w5:s[dcl]\np/(s[pt]\np):VBP:PERF w14:n/n:NN:humam w3:n:NNS:problem w13:np/n:DT:the w12:np\np/np:IN:as w2:np/n:DT:the w11:np\np/(np\np):JJ:such w1:s[dcl]\np/np:VBD:mention w0:np:PRP:we w28:n:NN:timor w27:n/n:JJ:east w26:s\np\(s\np)/np:TO:to w25:n:NNS:officer w24:n/n:JJ:military w23:s[ng]\np/np:VBG:send w22:np\np/(s[ng]\np):IN:of w21:n:NN:issue w20:np/n:DT:the we:S-we:P-PRP:T-np mentioned:S-mention:P-VBD:T-s[dcl]\np/np the:S-the:P-DT:T-np/n problems:S-problem:P-NNS:T-n that:S-that:P-WDT:T-np\np/(s[dcl]\np) have:S-have:P-VBP:T-s[dcl]\np/(s[pt]\np) attracted:S-attract:P-VBN:T-s[pt]\np/np australia:S-australia:P-NN:T-n 's:S-'s:P-POS:T-np/n\np attention:S-attention:P-NN:T-n ,:S-,:P-,:T-s[dcl]\np\(s[dcl]\np) such:S-such:P-JJ:T-np\np/(np\np) as:S-as:P-IN:T-np\np/np the:S-the:P-DT:T-np/n humam:S-humam:P-NN:T-n/n rights:S-rights:P-NNS:T-n in:S-in:P-IN:T-np\np/np east:S-east:P-JJ:T-n/n timor:S-timor:P-NN:T-n and:S-and:P-CC:T-np\np/np the:S-the:P-DT:T-np/n issue:S-issue:P-NN:T-n of:S-of:P-IN:T-np\np/(s[ng]\np) sending:S-send:P-VBG:T-s[ng]\np/np military:S-military:P-JJ:T-n/n officers:S-officer:P-NNS:T-n to:S-to:P-TO:T-s\np\(s\np)/np east:S-east:P-JJ:T-n/n timor:S-timor:P-NN:T-n .:S-.:P-.:T-sent\s[dcl] the two prime ministers requested that un secretary-general prolong the un representative 's stay in cambodia to 6 months or longer . w19:np\np\(np\np)/(np\np):CC:or w9:np/n:DT:the w18:n:NNS:month w8:s[ng]\np/np:VBG:prolong w7:n:NN:secretary-general w17:n/n:CD:6 w16:np\np/np:TO:to w6:n/n:JJ:un w15:n:NN:cambodia w5:np/n:DT:that w14:np\np/np:IN:in w4:s[dcl]\np/np:VBD:request w13:n:NN:stay w3:n:NNS:minister w2:n/n:JJ:prime w11:n:NN:representative w1:n/n:CD:two w10:n/n:JJ:un w0:np/n:DT:the w20:np\np:JJR:longer the:S-the:P-DT:T-np/n two:S-two:P-CD:T-n/n prime:S-prime:P-JJ:T-n/n ministers:S-minister:P-NNS:T-n requested:S-request:P-VBD:T-s[dcl]\np/np that:S-that:P-DT:T-np/n un:S-un:P-JJ:T-n/n secretary-general:S-secretary-general:P-NN:T-n prolong:S-prolong:P-VBG:T-s[ng]\np/np the:S-the:P-DT:T-np/n un:S-un:P-JJ:T-n/n representative:S-representative:P-NN:T-n 's:S-'s:P-POS:T-np/n\np stay:S-stay:P-NN:T-n in:S-in:P-IN:T-np\np/np cambodia:S-cambodia:P-NN:T-n to:S-to:P-TO:T-np\np/np 6:S-6:P-CD:T-n/n months:S-month:P-NNS:T-n or:S-or:P-CC:T-np\np\(np\np)/(np\np) longer:S-longer:P-JJR:T-np\np .:S-.:P-.:T-sent\s[dcl] the two prime ministers of cambodia asked the un secretary general to extend the un representative 's term of stay in cambodia to six months or longer . 
w19:n:NN:stay w9:n:NN:secretary w18:np\np/np:IN:of w8:n/n:NN:un w17:n:NN:term w7:np/n:DT:the w6:s[dcl]\np/(s[to]\np)/np:VBD:ask w15:n:NN:representative w5:n:NN:cambodia w14:n/n:JJ:un w4:np\np/np:IN:of w3:n:NNS:minister w13:np/n:DT:the w12:s[b]\np/pp/np:VB:extend w2:n/n:JJ:prime w1:n/n:CD:two w10:s[adj]\np:JJ:general w0:np/n:DT:the w26:np\np:JJR:longer w25:np\np/(np\np):CC:or w24:n:NNS:month w23:n/n:CD:six w22:pp/np:TO:to w21:n:NN:cambodia w20:np\np/np:IN:in the:S-the:P-DT:T-np/n two:S-two:P-CD:T-n/n prime:S-prime:P-JJ:T-n/n ministers:S-minister:P-NNS:T-n of:S-of:P-IN:T-np\np/np cambodia:S-cambodia:P-NN:T-n asked:S-ask:P-VBD:T-s[dcl]\np/(s[to]\np)/np the:S-the:P-DT:T-np/n un:S-un:P-NN:T-n/n secretary:S-secretary:P-NN:T-n general:S-general:P-JJ:T-s[adj]\np to:S-to:P-TO:T-s[to]\np/(s[b]\np) extend:S-extend:P-VB:T-s[b]\np/pp/np the:S-the:P-DT:T-np/n un:S-un:P-JJ:T-n/n representative:S-representative:P-NN:T-n 's:S-'s:P-POS:T-np/n\np term:S-term:P-NN:T-n of:S-of:P-IN:T-np\np/np stay:S-stay:P-NN:T-n in:S-in:P-IN:T-np\np/np cambodia:S-cambodia:P-NN:T-n to:S-to:P-TO:T-pp/np six:S-six:P-CD:T-n/n months:S-month:P-NNS:T-n or:S-or:P-CC:T-np\np/(np\np) longer:S-longer:P-JJR:T-np\np .:S-.:P-.:T-sent\s[dcl]

================================================
FILE: test/rules.xml
================================================

================================================
FILE: test/testlf.xml
================================================