[developers] Problem with the SMAF interface in PET
Christopher Rupp
Christopher.Rupp at cl.cam.ac.uk
Mon Nov 10 15:08:13 CET 2008
Hi,
I'm having a bit of a problem with the SMAF interface in the latest version of
PET checked out from the SVN repository. I make that revision 502. (In order to
exhibit the log I've commented out the 'sm := "jhpstg.mem".' setting in the
common.set file because this causes lots of warnings.)
cr351 at mcgraw /home/cr351/tmp 538: cat s31_smaf_script |
/tmp/cr351/pet/bin/cheap -default-les -packing=15 -memlimit=500 -nsolutions=5
-tok=smaf -mrs=new ~/work/erg/english.grm
reading `/home/cr351/work/erg/pet/english.set'... including
`/home/cr351/work/erg/pet/common.set'... including
`/home/cr351/work/erg/pet/global.set'... including
`/home/cr351/work/erg/pet/mrs.set'... loading `/home/cr351/work/erg/english.grm
'
(LinGO (July-08)) ;;WARNING: The function 'x-read-preprocessor' is deprecated.
Please use 'read-preprocessor' instead.
Reading preprocessor rules '/home/cr351/work/erg/preprocessor.fsr'
Reading preprocessor rules '/local/scratch/cr351/erg/rondane.fsr'
#[X-FSPP (132 global, 141 token-level rules @ `[ \t]+')]
read-vpm(): reading file `semi.vpm'.
92949 types in 6.5 s
no lexicon entries for:
"target="v1698"" []
"type="oscar"" []
"id="p737_f678"" []
"id="p732_f674"" []
"cfrom="6722"" []
"target="v1703"" []
"id="p742_f683"" []
"cfrom="6750"" []
"cfrom="6731"" []
"document="/tmp" []
"type="token"" []
"cfrom="6763"" []
"type="token"" []
"type="oscar"" []
"id="p736_f677"" []
"addressing="char"><lattice" []
"name="surface">amino</slot><slot" []
"deps="s31">amino</edge><edge" []
"deps="s31"><slot" []
"id="p741_f682"" []
"id="f674"" []
"name="surface">hydrogen</slot><slot" []
"cfrom="6747"" []
"target="v1701"" []
"type="token"" []
"cto="6740"" []
"type="token"" []
"type="token"" []
"cfrom="6777"" []
"deps="s31">an</edge><edge" []
"deps="s31">the</edge><edge" []
"deps="s31">hydrogen</edge><edge" []
"cfrom="6741"" []
"cto="6752"" []
"name="dtype">token</slot></edge></lattice></smaf>" []
"type="token"" []
"id="p739_f680"" []
"cto="6734"" []
"cto="6771"" []
"source="v1696"" []
"cfrom="6772"" []
"type="token"" []
"deps="s31">is</edge><edge" []
"deps="s31">however,</edge><edge" []
"deps="s31">donor.</edge><edge" []
"cto="6749"" []
"type="token"" []
"cto="6730"" []
"source="v1699"" []
"source="v1695"" []
"source="v1701"" []
"cto="6783"" []
"type="token"" []
"deps="s31">group</edge><edge" []
"source="v60"" []
"deps="s31">bond</edge><edge" []
"cto="6783"><edge" []
"target="v1697"" []
"cto="6746"" []
"source="v1698"" []
"source="v60"" []
"target="v1695"" []
"cto="6776"" []
"source="v1703"" []
"deps="s31">excellent</edge><edge" []
"b309733a.xml" []
"cr351" []
"target="v1701"" []
"target="v1697"" []
"target="v1702"" []
"id="fo60"" []
"source="v1697"" []
"final="v61"" []
"source="v1702"" []
"cto="6762"" []
"target="v1700"" []
"target="v1696"" []
"id="f680"" []
"target="v1702"" []
"id="f676"" []
"id="fo61"" []
"target="v1699"" []
"source="v1700"" []
"id="f679"" []
"cfrom="6735"" []
"id="f675"" []
"id="f681"" []
"target="v61"" []
"name="tag">jj</slot><slot" []
"name="dtype">token</slot></edge><edge" []
"target="v1698"" []
"cfrom="6750"" []
"id="f678"" []
"cfrom="6731"" []
"cfrom="6763"" []
"type="pos"" []
"target="v1703"" []
"name="tag">at1</slot><slot" []
"name="tag">at</slot><slot" []
"name="tag">nn1</slot><slot" []
"id="f683"" []
"name="dtype">token</slot></edge><edge" []
"name="dtype">token</slot></edge><edge" []
"name="dtype">token</slot></edge><edge" []
"<smaf" []
"cto="6740"" []
"cfrom="6747"" []
"id="f677"" []
"cfrom="6722"" []
"type="pos"" []
"type="pos"" []
"cto="6730"" []
"type="pos"" []
"name="tag">vbz</slot><slot" []
"cfrom="6777"" []
"name="tag">rrq</slot><slot" []
"name="tag">jj</slot><slot" []
"id="f682"" []
"name="dtype">token</slot></edge><edge" []
"name="dtype">token</slot></edge><edge" []
"name="tag">nn1</slot><slot" []
"name="dtype">token</slot></edge><edge" []
"s31"" []
"f1_scixml" []
"cto="6762"" []
"cto="6740"" []
"cto="6771"" []
"source="v1696"" []
"cfrom="6741"" []
"type="pos"" []
"type="pos"" []
"name="tag">nn1</slot><slot" []
"cfrom="6772"" []
"type="pos"" []
"name="dtype">token</slot></edge><edge" []
"name="tag">nn1</slot><slot" []
"cto="6752"" []
"cto="6734"" []
"name="dtype">token</slot></edge><edge" []
"cto="6771"" []
"source="v1700"" []
"source="v1696"" []
"source="v1701"" []
"type="pos"" []
"deps="f676"><slot" []
"init="v60"" []
"name="tag">nn1</slot><slot" []
"type="pos"" []
"name="type">cm</slot></edge><edge" []
"type="token"" []
"name="tag">nn1</slot><slot" []
"cto="6749"" []
"cfrom="6753"" []
"name="type">cm</slot></edge><edge" []
"source="v1699"" []
"source="v1695"" []
"source="v1701"" []
"cto="6783"" []
"deps="f679"><slot" []
"deps="f675"><slot" []
"deps="f681"><slot" []
"cto="6746"" []
"source="v1698"" []
"type="pos"" []
"target="v1697"" []
"deps="f678"><slot" []
"cto="6776"" []
"deps="f674"><slot" []
"source="v1703"" []
"deps="f680"><slot" []
"deps="f683"><slot" []
"deps="s31"><slot" []
"source="v1697"" []
"target="v1700"" []
"target="v1696"" []
"target="v1702"" []
"id="p735_f676"" []
"deps="f677"><slot" []
"source="v1702"" []
"deps="f682"><slot" []
"cfrom="6735"" []
"target="v1699"" []
"target="v1695"" []
"id="p738_f679"" []
"cfrom="6722"" []
"id="p734_f675"" []
"id="p740_f681"" []
"target="v61"" []
"cfrom="6753"" []
"cfrom="6735"" []
"cfrom="6763"" []
It looks as if the XML reader is not coping with the SMAF XML input correctly.
(The cut-off point where it stops printing missing lexicon entries is not
always the same for the same input.)
I've also got an instance of revision 486 checked out which appears to read the
SMAFs correctly.
cr351 at mcgraw /home/cr351/tmp 510:cat s31_smaf_script |
/local/scratch/cr351/pet/bin/cheap -default-les -memlimit=500 -tok=smaf
-mrs=new -results=1 ~/work/erg/english.grm
reading `/home/cr351/work/erg/pet/english.set'... including `/home/cr351/work/erg/pet/common.set'... including `/home/cr351/work/erg/pet/global.set'... including `/home/cr351/work/erg/pet/mrs.set'...
loading `/home/cr351/work/erg/english.grm' (LinGO (July-08))
reading SMAF conf '/local/scratch/cr351/erg/pet/smaf.conf'...
read-vpm(): reading file `semi.vpm'.
92949 types in 5.2 s
(1) `however, the amino group is an excellent hydrogen bond donor.' [0] --- 120 (0.22|0.52s) <45:2968> (28297.9K) [0.5s]
derivation[1] (0):however, the oscarcompound group is an excellent oscarcompound bond donor.
<mrs>
<label vid='1'/><var vid='2'/>
<ep cfrom='6731' cto='6734'><pred>_THE_Q_REL</pred><label vid='3'/>
<fvpair><rargname>ARG0</rargname><var vid='6' sort='x'>
<extrapair><path>PERS</path><value>3</value></extrapair>
<extrapair><path>NUM</path><value>SG</value></extrapair>
<extrapair><path>IND</path><value>+</value></extrapair>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair>
<fvpair><rargname>RSTR</rargname><var vid='5' sort='h'></var></fvpair>
<fvpair><rargname>BODY</rargname><var vid='4' sort='h'></var></fvpair></ep>
<ep cfrom='6735' cto='6746'><pred>COMPOUND_REL</pred><label vid='7'/>
<fvpair><rargname>ARG0</rargname><var vid='9' sort='e'>
<extrapair><path>TENSE</path><value>UNTENSED</value></extrapair>
<extrapair><path>MOOD</path><value>INDICATIVE</value></extrapair>
<extrapair><path>PROG</path><value>-</value></extrapair>
<extrapair><path>PERF</path><value>-</value></extrapair>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair>
<fvpair><rargname>ARG1</rargname><var vid='6' sort='x'>
<extrapair><path>PERS</path><value>3</value></extrapair>
<extrapair><path>NUM</path><value>SG</value></extrapair>
<extrapair><path>IND</path><value>+</value></extrapair>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair>
<fvpair><rargname>ARG2</rargname><var vid='8' sort='x'>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair></ep>
<ep cfrom='6735' cto='6746'><pred>UDEF_Q_REL</pred><label vid='10'/>
<fvpair><rargname>ARG0</rargname><var vid='8' sort='x'>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair>
<fvpair><rargname>RSTR</rargname><var vid='12' sort='h'></var></fvpair>
<fvpair><rargname>BODY</rargname><var vid='11' sort='h'></var></fvpair></ep>
<ep cfrom='6735' cto='6740'><spred>_oscarcompound_n_1_rel</spred><label vid='13'/>
<fvpair><rargname>ARG0</rargname><var vid='8' sort='x'>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair></ep>
<ep cfrom='6741' cto='6746'><spred>_group_n_of_rel</spred><label vid='7'/>
<fvpair><rargname>ARG0</rargname><var vid='6' sort='x'>
<extrapair><path>PERS</path><value>3</value></extrapair>
<extrapair><path>NUM</path><value>SG</value></extrapair>
<extrapair><path>IND</path><value>+</value></extrapair>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair></ep>
<ep cfrom='6747' cto='6749'><pred>_BE_V_ID_REL</pred><label vid='14'/>
<fvpair><rargname>ARG0</rargname><var vid='2' sort='e'>
<extrapair><path>TENSE</path><value>PRES</value></extrapair>
<extrapair><path>MOOD</path><value>INDICATIVE</value></extrapair>
<extrapair><path>PROG</path><value>-</value></extrapair>
<extrapair><path>PERF</path><value>-</value></extrapair>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair>
<fvpair><rargname>ARG1</rargname><var vid='6' sort='x'>
<extrapair><path>PERS</path><value>3</value></extrapair>
<extrapair><path>NUM</path><value>SG</value></extrapair>
<extrapair><path>IND</path><value>+</value></extrapair>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair>
<fvpair><rargname>ARG2</rargname><var vid='15' sort='x'>
<extrapair><path>PERS</path><value>3</value></extrapair>
<extrapair><path>NUM</path><value>SG</value></extrapair>
<extrapair><path>IND</path><value>+</value></extrapair>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair></ep>
<ep cfrom='6750' cto='6752'><pred>_A_Q_REL</pred><label vid='16'/>
<fvpair><rargname>ARG0</rargname><var vid='15' sort='x'>
<extrapair><path>PERS</path><value>3</value></extrapair>
<extrapair><path>NUM</path><value>SG</value></extrapair>
<extrapair><path>IND</path><value>+</value></extrapair>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair>
<fvpair><rargname>RSTR</rargname><var vid='17' sort='h'></var></fvpair>
<fvpair><rargname>BODY</rargname><var vid='18' sort='h'></var></fvpair></ep>
<ep cfrom='6753' cto='6762'><spred>_excellent_a_1_rel</spred><label vid='19'/>
<fvpair><rargname>ARG0</rargname><var vid='20' sort='e'>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair>
<fvpair><rargname>ARG1</rargname><var vid='15' sort='x'>
<extrapair><path>PERS</path><value>3</value></extrapair>
<extrapair><path>NUM</path><value>SG</value></extrapair>
<extrapair><path>IND</path><value>+</value></extrapair>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair></ep>
<ep cfrom='6763' cto='6783'><pred>COMPOUND_REL</pred><label vid='19'/>
<fvpair><rargname>ARG0</rargname><var vid='21' sort='e'>
<extrapair><path>TENSE</path><value>UNTENSED</value></extrapair>
<extrapair><path>MOOD</path><value>INDICATIVE</value></extrapair>
<extrapair><path>PROG</path><value>-</value></extrapair>
<extrapair><path>PERF</path><value>-</value></extrapair>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair>
<fvpair><rargname>ARG1</rargname><var vid='15' sort='x'>
<extrapair><path>PERS</path><value>3</value></extrapair>
<extrapair><path>NUM</path><value>SG</value></extrapair>
<extrapair><path>IND</path><value>+</value></extrapair>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair>
<fvpair><rargname>ARG2</rargname><var vid='22' sort='x'>
<extrapair><path>PERS</path><value>3</value></extrapair>
<extrapair><path>NUM</path><value>SG</value></extrapair>
<extrapair><path>IND</path><value>+</value></extrapair>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair></ep>
<ep cfrom='6763' cto='6776'><pred>COMPOUND_NAME_REL</pred><label vid='23'/>
<fvpair><rargname>ARG0</rargname><var vid='24' sort='e'>
<extrapair><path>TENSE</path><value>UNTENSED</value></extrapair>
<extrapair><path>MOOD</path><value>INDICATIVE</value></extrapair>
<extrapair><path>PROG</path><value>-</value></extrapair>
<extrapair><path>PERF</path><value>-</value></extrapair>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair>
<fvpair><rargname>ARG1</rargname><var vid='22' sort='x'>
<extrapair><path>PERS</path><value>3</value></extrapair>
<extrapair><path>NUM</path><value>SG</value></extrapair>
<extrapair><path>IND</path><value>+</value></extrapair>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair>
<fvpair><rargname>ARG2</rargname><var vid='25' sort='x'>
<extrapair><path>PERS</path><value>3</value></extrapair>
<extrapair><path>NUM</path><value>SG</value></extrapair>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair></ep>
<ep cfrom='6763' cto='6776'><pred>UDEF_Q_REL</pred><label vid='26'/>
<fvpair><rargname>ARG0</rargname><var vid='25' sort='x'>
<extrapair><path>PERS</path><value>3</value></extrapair>
<extrapair><path>NUM</path><value>SG</value></extrapair>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair>
<fvpair><rargname>RSTR</rargname><var vid='28' sort='h'></var></fvpair>
<fvpair><rargname>BODY</rargname><var vid='27' sort='h'></var></fvpair></ep>
<ep cfrom='6763' cto='6771'><spred>_oscarcompound_n_1_rel</spred><label vid='29'/>
<fvpair><rargname>ARG0</rargname><var vid='25' sort='x'>
<extrapair><path>PERS</path><value>3</value></extrapair>
<extrapair><path>NUM</path><value>SG</value></extrapair>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair></ep>
<ep cfrom='6772' cto='6776'><pred>PROPER_Q_REL</pred><label vid='30'/>
<fvpair><rargname>ARG0</rargname><var vid='22' sort='x'>
<extrapair><path>PERS</path><value>3</value></extrapair>
<extrapair><path>NUM</path><value>SG</value></extrapair>
<extrapair><path>IND</path><value>+</value></extrapair>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair>
<fvpair><rargname>RSTR</rargname><var vid='31' sort='h'></var></fvpair>
<fvpair><rargname>BODY</rargname><var vid='32' sort='h'></var></fvpair></ep>
<ep cfrom='6772' cto='6776'><pred>NAMED_REL</pred><label vid='33'/>
<fvpair><rargname>ARG0</rargname><var vid='22' sort='x'>
<extrapair><path>PERS</path><value>3</value></extrapair>
<extrapair><path>NUM</path><value>SG</value></extrapair>
<extrapair><path>IND</path><value>+</value></extrapair>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair>
<fvpair><rargname>CARG</rargname><constant>Bond</constant></fvpair></ep>
<ep cfrom='6777' cto='6783'><spred>_donor_n_1_rel</spred><label vid='19'/>
<fvpair><rargname>ARG0</rargname><var vid='15' sort='x'>
<extrapair><path>PERS</path><value>3</value></extrapair>
<extrapair><path>NUM</path><value>SG</value></extrapair>
<extrapair><path>IND</path><value>+</value></extrapair>
<extrapair><path>SF</path><value>PROP</value></extrapair></var></fvpair></ep>
<hcons hreln='qeq'><hi><var vid='5' sort='h'></var></hi><lo><var vid='7' sort='h'></var></lo></hcons>
<hcons hreln='qeq'><hi><var vid='12' sort='h'></var></hi><lo><var vid='13' sort='h'></var></lo></hcons>
<hcons hreln='qeq'><hi><var vid='17' sort='h'></var></hi><lo><var vid='19' sort='h'></var></lo></hcons>
<hcons hreln='qeq'><hi><var vid='28' sort='h'></var></hi><lo><var vid='29' sort='h'></var></lo></hcons>
<hcons hreln='qeq'><hi><var vid='31' sort='h'></var></hi><lo><var vid='33' sort='h'></var></lo></hcons>
</mrs>
(With no model, I restricted the result count. This shouldn't be significant.)
I'm attaching the input SMAF file. I did try to check out the older version again,
but I don't think I have access. I can see the logic in that, but it means someone
else has to look for the modification which causes this change in behaviour. I was
not able to find anything significant in a global diff of the two versions. I do
note, however, that the lines around the deprecated 'x-read-preprocessor' only appear
in the startup of the newer version. (Bear in mind that the LKB code, ERG grammar,
and config options are the same in both cases:
./configure --with-tsdb=/local/scratch/cr351/lkb --with-xml=/local/scratch/cr351/xerces/xerces-c_2_8_0-x86_64-linux-gcc_3_4 --with-mrsdir=/local/scratch/cr351/lkb --with-ecl=/local/scratch/cr351/ecl --with-icu=/local/scratch/cr351/icu --prefix=/tmp/cr351/pet --enable-qccomp
)
Can anyone help with this? Presumably you have to be a PET developer to get full
access to the repository. Thanks.
Cheers,
C.J.
--
Dr. C.J. Rupp
University of Cambridge Computer Laboratory
William Gates Building
15 JJ Thomson Avenue
Cambridge CB3 0FD, UK
Tel: +44 1223 767025
Fax: +44 1223 334678
Mobile: +44 795-8496 916
Email: cr351 at cl.cam.ac.uk
-------------- next part --------------
<smaf document="/tmp/cr351/f1_scixml/b309733a.xml - s31" addressing="char"><lattice init="v60" final="v61" cfrom="6722" cto="6783"><edge id="f674" type="token" source="v60" target="v1695" cfrom="6722" cto="6730" deps="s31">However,</edge><edge id="p732_f674" type="pos" source="v60" target="v1695" cfrom="6722" cto="6730" deps="f674"><slot name="tag">RRQ</slot><slot name="dtype">token</slot></edge><edge id="f675" type="token" source="v1695" target="v1696" cfrom="6731" cto="6734" deps="s31">the</edge><edge id="p734_f675" type="pos" source="v1695" target="v1696" cfrom="6731" cto="6734" deps="f675"><slot name="tag">AT</slot><slot name="dtype">token</slot></edge><edge id="f676" type="token" source="v1696" target="v1697" cfrom="6735" cto="6740" deps="s31">amino</edge><edge id="p735_f676" type="pos" source="v1696" target="v1697" cfrom="6735" cto="6740" deps="f676"><slot name="tag">JJ</slot><slot name="dtype">token</slot></edge><edge id="fo60" type="oscar" source="v1696" target="v1697" cfrom="6735" cto="6740" deps="s31"><slot name="surface">amino</slot><slot name="tag">NN1</slot><slot name="type">CM</slot></edge><edge id="f677" type="token" source="v1697" target="v1698" cfrom="6741" cto="6746" deps="s31">group</edge><edge id="p736_f677" type="pos" source="v1697" target="v1698" cfrom="6741" cto="6746" deps="f677"><slot name="tag">NN1</slot><slot name="dtype">token</slot></edge><edge id="f678" type="token" source="v1698" target="v1699" cfrom="6747" cto="6749" deps="s31">is</edge><edge id="p737_f678" type="pos" source="v1698" target="v1699" cfrom="6747" cto="6749" deps="f678"><slot name="tag">VBZ</slot><slot name="dtype">token</slot></edge><edge id="f679" type="token" source="v1699" target="v1700" cfrom="6750" cto="6752" deps="s31">an</edge><edge id="p738_f679" type="pos" source="v1699" target="v1700" cfrom="6750" cto="6752" deps="f679"><slot name="tag">AT1</slot><slot name="dtype">token</slot></edge><edge id="f680" type="token" source="v1700" target="v1701" cfrom="6753" 
cto="6762" deps="s31">excellent</edge><edge id="p739_f680" type="pos" source="v1700" target="v1701" cfrom="6753" cto="6762" deps="f680"><slot name="tag">JJ</slot><slot name="dtype">token</slot></edge><edge id="f681" type="token" source="v1701" target="v1702" cfrom="6763" cto="6771" deps="s31">hydrogen</edge><edge id="p740_f681" type="pos" source="v1701" target="v1702" cfrom="6763" cto="6771" deps="f681"><slot name="tag">NN1</slot><slot name="dtype">token</slot></edge><edge id="fo61" type="oscar" source="v1701" target="v1702" cfrom="6763" cto="6771" deps="s31"><slot name="surface">hydrogen</slot><slot name="tag">NN1</slot><slot name="type">CM</slot></edge><edge id="f682" type="token" source="v1702" target="v1703" cfrom="6772" cto="6776" deps="s31">bond</edge><edge id="p741_f682" type="pos" source="v1702" target="v1703" cfrom="6772" cto="6776" deps="f682"><slot name="tag">NN1</slot><slot name="dtype">token</slot></edge><edge id="f683" type="token" source="v1703" target="v61" cfrom="6777" cto="6783" deps="s31">donor.</edge><edge id="p742_f683" type="pos" source="v1703" target="v61" cfrom="6777" cto="6783" deps="f683"><slot name="tag">NN1</slot><slot name="dtype">token</slot></edge></lattice></smaf>
More information about the developers
mailing list