<?xml version="1.0" encoding="utf-8"?><fo:root xmlns:fo="http://www.w3.org/1999/XSL/Format" line-height-shift-adjustment="disregard-shifts" line-height="2.4"><!-- generated by XLingPapPublisherStylesheetFO.xsl Version 2.8.0--><fo:layout-master-set><fo:simple-page-master page-width="8.5in" page-height="11in" margin-top="1in" margin-bottom="1in" margin-left="1.5in" margin-right="1in" master-name="FrontMatterPage"><fo:region-body margin-top=".25in" margin-bottom=".25in"/><fo:region-before extent=".25in"/><fo:region-after region-name="xsl-region-after" extent=".25in"/></fo:simple-page-master><fo:simple-page-master page-width="8.5in" page-height="11in" margin-top="1in" margin-bottom="1in" margin-left="1.5in" margin-right="1in" master-name="FrontMatterTOCFirstPage"><fo:region-body margin-top=".25in" margin-bottom=".25in"/><fo:region-before extent=".25in"/><fo:region-after region-name="FrontMatterTOCFirstPage-after" extent=".25in"/></fo:simple-page-master><fo:simple-page-master page-width="8.5in" page-height="11in" margin-top="1in" margin-bottom="1in" margin-left="1in" margin-right="1.5in" master-name="FrontMatterTOCEvenPage"><fo:region-body margin-top=".25in" margin-bottom=".25in"/><fo:region-before region-name="FrontMatterTOCEvenPage-before" extent=".25in"/><fo:region-after region-name="xsl-region-after" extent=".25in"/></fo:simple-page-master><fo:simple-page-master page-width="8.5in" page-height="11in" margin-top="1in" margin-bottom="1in" margin-left="1.5in" margin-right="1in" master-name="FrontMatterTOCOddPage"><fo:region-body margin-top=".25in" margin-bottom=".25in"/><fo:region-before region-name="FrontMatterTOCOddPage-before" extent=".25in"/><fo:region-after region-name="xsl-region-after" extent=".25in"/></fo:simple-page-master><fo:simple-page-master page-width="8.5in" page-height="11in" margin-top="1in" margin-bottom="1in" margin-left="1in" margin-right="1.5in" master-name="FrontMatterBlankEvenPage"><fo:region-body margin-top=".25in" 
margin-bottom=".25in"/><fo:region-before region-name="xsl-region-before" extent=".25in"/><fo:region-after region-name="xsl-region-after" extent=".25in"/></fo:simple-page-master><fo:simple-page-master page-width="8.5in" page-height="11in" margin-top="1in" margin-bottom="1in" margin-left="1.5in" margin-right="1in" master-name="ChapterFirstPage"><fo:region-body margin-top=".25in" margin-bottom=".25in"/><fo:region-before region-name="ChapterFirstPage-before" extent=".25in"/><fo:region-after region-name="ChapterFirstPage-after" extent=".25in"/></fo:simple-page-master><fo:simple-page-master page-width="8.5in" page-height="11in" margin-top="1in" margin-bottom="1in" margin-left="1in" margin-right="1.5in" master-name="ChapterEvenPage"><fo:region-body margin-top=".25in" margin-bottom=".25in"/><fo:region-before region-name="ChapterEvenPage-before" extent=".25in"/><fo:region-after region-name="ChapterEvenPage-after" extent=".25in"/></fo:simple-page-master><fo:simple-page-master page-width="8.5in" page-height="11in" margin-top="1in" margin-bottom="1in" margin-left="1.5in" margin-right="1in" master-name="ChapterOddPage"><fo:region-body margin-top=".25in" margin-bottom=".25in"/><fo:region-before region-name="ChapterOddPage-before" extent=".25in"/><fo:region-after region-name="ChapterOddPage-after" extent=".25in"/></fo:simple-page-master><fo:simple-page-master page-width="8.5in" page-height="11in" margin-top="1in" margin-bottom="1in" margin-left="1.5in" margin-right="1in" master-name="IndexFirstPage"><fo:region-body margin-top=".25in" margin-bottom=".25in" column-count="2" column-gap="0.25in"/><fo:region-before region-name="IndexFirstPage-before" extent=".25in"/><fo:region-after region-name="IndexFirstPage-after" extent=".25in"/></fo:simple-page-master><fo:simple-page-master page-width="8.5in" page-height="11in" margin-top="1in" margin-bottom="1in" margin-left="1in" margin-right="1.5in" master-name="IndexEvenPage"><fo:region-body margin-top=".25in" margin-bottom=".25in" 
column-count="2" column-gap="0.25in"/><fo:region-before region-name="IndexEvenPage-before" extent=".25in"/><fo:region-after region-name="IndexEvenPage-after" extent=".25in"/></fo:simple-page-master>
<fo:simple-page-master page-width="8.5in" page-height="11in" margin-top="1in" margin-bottom="1in" margin-left="1.5in" margin-right="1in" master-name="IndexOddPage"><fo:region-body margin-top=".25in" margin-bottom=".25in" column-count="2" column-gap="0.25in"/><fo:region-before region-name="IndexOddPage-before" extent=".25in"/><fo:region-after region-name="IndexOddPage-after" extent=".25in"/></fo:simple-page-master>
<fo:simple-page-master page-width="8.5in" page-height="11in" margin-top="1in" margin-bottom="1in" margin-left="1in" margin-right="1.5in" master-name="BlankEvenPage"><fo:region-body margin-top=".25in" margin-bottom=".25in"/><fo:region-before region-name="BlankEvenPage-before" extent=".25in"/><fo:region-after region-name="BlankEvenPage-after" extent=".25in"/></fo:simple-page-master>
<!-- FrontMatter page selection. Alternatives are evaluated in document order and the
     first one whose conditions hold is used. The blank even alternative therefore has
     to come before the unconditional even alternative (which also matches blank pages);
     otherwise FrontMatterBlankEvenPage would never be selected. -->
<fo:page-sequence-master master-name="FrontMatter"><fo:repeatable-page-master-alternatives>
<fo:conditional-page-master-reference page-position="first" master-reference="FrontMatterPage"/>
<fo:conditional-page-master-reference odd-or-even="even" blank-or-not-blank="blank" master-reference="FrontMatterBlankEvenPage"/>
<fo:conditional-page-master-reference odd-or-even="odd" master-reference="FrontMatterPage"/>
<fo:conditional-page-master-reference odd-or-even="even" master-reference="FrontMatterPage"/>
</fo:repeatable-page-master-alternatives></fo:page-sequence-master>
<fo:page-sequence-master master-name="FrontMatterTOC"><fo:repeatable-page-master-alternatives><fo:conditional-page-master-reference page-position="first" master-reference="FrontMatterTOCFirstPage"/><fo:conditional-page-master-reference odd-or-even="even" blank-or-not-blank="blank" master-reference="FrontMatterBlankEvenPage"/><fo:conditional-page-master-reference odd-or-even="even" 
master-reference="FrontMatterTOCEvenPage"/><fo:conditional-page-master-reference odd-or-even="odd" master-reference="FrontMatterTOCOddPage"/></fo:repeatable-page-master-alternatives></fo:page-sequence-master><fo:page-sequence-master master-name="Chapter"><fo:repeatable-page-master-alternatives><fo:conditional-page-master-reference page-position="first" master-reference="ChapterFirstPage"/><fo:conditional-page-master-reference odd-or-even="even" blank-or-not-blank="blank" master-reference="BlankEvenPage"/><fo:conditional-page-master-reference odd-or-even="even" master-reference="ChapterEvenPage"/><fo:conditional-page-master-reference odd-or-even="odd" master-reference="ChapterOddPage"/></fo:repeatable-page-master-alternatives></fo:page-sequence-master><fo:page-sequence-master master-name="Index"><fo:repeatable-page-master-alternatives><fo:conditional-page-master-reference page-position="first" master-reference="IndexFirstPage"/><fo:conditional-page-master-reference odd-or-even="even" blank-or-not-blank="blank" master-reference="BlankEvenPage"/><fo:conditional-page-master-reference odd-or-even="even" master-reference="IndexEvenPage"/><fo:conditional-page-master-reference odd-or-even="odd" master-reference="IndexOddPage"/></fo:repeatable-page-master-alternatives></fo:page-sequence-master></fo:layout-master-set><fo:page-sequence master-reference="FrontMatter" format="i"><fo:static-content flow-name="xsl-footnote-separator"><fo:block text-align="left"><fo:leader leader-pattern="rule" leader-length="2in"/></fo:block></fo:static-content><fo:flow flow-name="xsl-region-body" font-family="Arial"><!-- Front matter title page: an 18pt bold centered title block followed by a 14pt bold centered subtitle block. NOTE(review): the text content of the 18pt title block is the literal string keep-with-next.within-page="always", which looks like an attribute that leaked into element content; presumably the real title text was lost during generation. The same title/subtitle pair is also repeated a second time later in this flow. TODO confirm against the source document and regenerate. --><fo:block space-before.conditionality="retain" break-before="odd-page" font-size="18pt" font-weight="bold" space-before="1.25in" text-align="center"> keep-with-next.within-page="always"</fo:block><fo:block space-before.conditionality="retain" font-size="14pt" font-weight="bold" space-before=".25in" text-align="center">in section 1.1</fo:block><fo:block 
space-before.conditionality="retain" break-before="odd-page" font-size="18pt" font-weight="bold" space-before="1.25in" text-align="center"> keep-with-next.within-page="always"</fo:block><fo:block space-before.conditionality="retain" font-size="14pt" font-weight="bold" space-before=".25in" text-align="center">in section 1.1</fo:block><fo:block font-style="italic" text-align="center">contact: andy_black@sil.org</fo:block></fo:flow></fo:page-sequence><fo:page-sequence master-reference="Chapter" initial-page-number="1"><fo:static-content display-align="after" flow-name="ChapterFirstPage-after"><fo:block text-align-last="justify" margin-top="6pt" font-family="Times New Roman" font-size="9pt" font-style="italic"><fo:leader/><fo:inline font-size="9pt" font-style="italic"><fo:page-number/></fo:inline><fo:leader/></fo:block></fo:static-content><fo:static-content display-align="before" flow-name="ChapterEvenPage-before"><fo:block text-align-last="justify" font-family="Times New Roman" font-size="9pt" font-style="italic"><fo:inline font-size="9pt" font-style="italic"><fo:page-number/></fo:inline><fo:leader/><fo:inline font-size="9pt" font-style="italic"><fo:retrieve-marker retrieve-class-name="chap-title"/></fo:inline></fo:block></fo:static-content><fo:static-content display-align="before" flow-name="ChapterOddPage-before"><fo:block text-align-last="justify" font-family="Times New Roman" font-size="9pt" font-style="italic"><fo:inline font-size="9pt" font-style="italic"><fo:retrieve-marker retrieve-class-name="section-title"/></fo:inline><fo:leader/><fo:inline font-size="9pt" font-style="italic"><fo:page-number/></fo:inline></fo:block></fo:static-content><fo:static-content flow-name="xsl-footnote-separator"><fo:block text-align="left"><fo:leader leader-pattern="rule" leader-length="2in"/></fo:block></fo:static-content><fo:flow flow-name="xsl-region-body" font-family="Arial" font-size="12pt"><fo:marker marker-class-name="chap-title">PROBLEM</fo:marker><fo:block id="c2" 
break-before="odd-page" font-size="18pt" font-weight="bold" space-before="144pt" space-before.conditionality="retain" space-after="10.8pt" text-align="center" span="all">1</fo:block><fo:block font-size="18pt" font-weight="bold" space-after="21.6pt" text-align="center">PROBLEM</fo:block><fo:block orphans="2" widows="2" text-indent="1em"><fo:basic-link internal-destination="rSapir">Sapir (1921)</fo:basic-link> has said that “All grammars leak” meaning that as much as we want to believe that all published grammatical descriptions are watertight, there is always data that the linguist has not seen or has chosen to ignore (residue). The description may adequately explain what is happening in a carefully selected set of data or the description may adequately account for the majority of the data. But still there is residue that is not reported. How can the reviewer of a grammatical description ever obtain access to the residue, or ever be certain that the description would actually work for a totally new text gathered from a native speaker, or even that it would work for the whole data corpus the linguist was studying? A new kind of linguistic analysis and description is needed.</fo:block><fo:block id="sMorphologyproblem" keep-with-next.within-page="always" font-size="12pt" font-weight="bold" space-before="20pt" space-before.conditionality="retain" space-after="10pt" text-align="left"><fo:marker marker-class-name="section-title">Morphology</fo:marker><fo:inline><fo:inline>1.1</fo:inline> Morphology</fo:inline></fo:block><fo:block orphans="2" widows="2" keep-with-previous.within-page="always" text-indent="1em">The real test of a description of the morphology of a language is whether it can be used to parse any word in the language appearing in a natural text while at the same time rejecting ungrammatical wordforms. 
The ultimate goal is that the description could be empirically verified by implementing it in an automated parser that would correctly parse any wordform occurring in natural text. FLEx enables such synchronization between description and automatic parsing as it uses the same underlying data to generate both a morphology sketch and an automated parser for testing the accuracy of the analysis on natural texts.</fo:block><fo:block orphans="2" widows="2" text-indent="1em">The goal of morphological research is not only to unambiguously parse all the words of a language into their constituent morphemes, but also to account for the whole structure of the wordform. Ideally, Philippine language features like voice/focus and aspect could be linked to the morphemes that bear them and then percolate up through the parsing process to become a part of the description of the whole wordform. This information can then be used by syntactic parsers that would operate on the analyzed wordforms. This is especially important for Philippine languages where voice affixes relate to the semantic roles of the nouns in the sentence. A syntactic parser that will work on the output of the morphological parser will need this feature information also, not just the final syntactic category of the wordform.</fo:block><fo:block orphans="2" widows="2" text-indent="1em">FLEx is the only software package that integrates a morphological parser, lexicon, and analysis tools with the ability to automatically generate structured morphology sketches. Unfortunately, even though FLEx has been available for a few years, uptake has been slow among Philippine linguists. Of those that are using it for dictionary purposes, none have made a serious attempt at a computational description of the morphology. 
Because of the degree of similarity between affixation systems of Philippine languages, having an empirically tested morphology model for one Philippine language should prove helpful for other Philippine language researchers and thus simplify their task.</fo:block><fo:block orphans="2" widows="2" text-indent="1em">FLEx automatically generates a sketch of the morphology based on the information in the database. This tool has the potential for aiding both linguists and linguistic consultants in identifying problems and inconsistencies in analysis as well as being a basis for a publishable morphological description. To date, however, the parsing tool has not yet been used for checking analyses and the morphology sketch has not yet been used for describing a Philippine language. Research identifying the strengths and weaknesses of using this method of analysis and description can help clarify its usefulness for other Austronesian languages as well.</fo:block><fo:block id="sSyntaxproblem" keep-with-next.within-page="always" font-size="12pt" font-weight="bold" space-before="20pt" space-before.conditionality="retain" space-after="10pt" text-align="left"><fo:marker marker-class-name="section-title">Syntax</fo:marker><fo:inline><fo:inline>1.2</fo:inline> Syntax</fo:inline></fo:block><fo:block orphans="2" widows="2" text-indent="1em">The real test of a syntax description is whether it can account for the syntax of any grammatically correct sentence in that language. When prose-only descriptions of the syntax of a language are written, it is hard to ascertain what percentage of the language phenomena is being described. 
If, however, the syntax description is formalized with a set of formal PSRs (Phrase Structure Rules) and natural language texts are used for testing the rules, it may be possible to state what portion of the syntax is accounted for by the description.</fo:block><fo:block orphans="2" widows="2" text-indent="1em">The team at the Center for Language Technologies led by Dr. Rachel Roxas of De La Salle University in Manila is seeking to develop computational tools and ultimately machine translation systems to and from Tagalog. Members of this team have mentioned “the minimal work done on the development of a computational grammar for the Filipino language for the development of robust and industrial strength natural language analysis and technologies” <fo:basic-link internal-destination="rAlcantara2008a">Alcantara and Borra (2008a)</fo:basic-link>. Many approaches have been proposed and prototypes have been developed for automatic generation of PSRs from various text collections, but as of this time, all of the final results have been labelled “insubstantial” by Borra.<fo:footnote><fo:inline font-family="Arial" text-align="left" text-align-last="left" text-indent="1em" start-indent="0pt" end-indent="0pt" font-style="normal" font-weight="normal" font-variant="normal" color="black" font-size="6pt" baseline-shift="super" id="nBorra">1</fo:inline><fo:footnote-body><fo:block font-family="Arial" text-align="left" text-align-last="left" text-indent="1em" start-indent="0pt" end-indent="0pt" font-style="normal" font-weight="normal" font-variant="normal" color="black" font-size="8pt" text-transform="none"><fo:inline baseline-shift="super" font-size="6pt">1</fo:inline>Personal communication (Nov. 11, 2008).</fo:block></fo:footnote-body></fo:footnote></fo:block><fo:block orphans="2" widows="2" text-indent="1em">The lack of a complete set of PSRs for Tagalog is a significant hindrance to NLP research in the Philippines. 
The same problem exists for other Philippine languages, especially the minority languages. But because of the similarities of syntax of many Philippine languages, it is hypothesized that PSRs modelling general language characteristics for any Philippine language could contribute insights into the development of PSR grammars for other Philippine languages. Thus a set of basic PSRs for any Philippine language could be used as a starting point for developing PSR grammars for other Philippine languages. However, as of this time, no such published grammar exists in a current linguistic formalism.</fo:block><fo:block orphans="2" widows="2" text-indent="1em">The PAWS Starter Kit could be a significant step forward toward this goal of developing Context Free PSRs for Philippine languages. If the developer’s claim is really true that 75% of the syntax of any language can be modelled in PSRs generated by just answering the questions in the PAWS Starter Kit, then this would be a significant step forward for all those doing research in this area. The problem is that no one has attempted to use the system for any Philippine language. Determining the percentage of phenomena handled by the automatically generated rules and performing an analysis of what went wrong and right in the syntax parsing process would be most helpful not only to the developers of PAWS but also to Philippine linguists considering whether to use it.</fo:block><fo:block orphans="2" widows="2" text-indent="1em">The syntax sketch that PAWS generates would seem to be a helpful tool for linguistic description, but it has not been used for a syntactic description of any Philippine language. This thesis provides an initial syntactic description of a Philippine language using the PAWS generated sketch. 
Discovering the areas where the linguist needs to adjust the description will be the most helpful in evaluating the usefulness of this tool.</fo:block></fo:flow></fo:page-sequence><fo:page-sequence master-reference="Chapter" initial-page-number="auto-odd"><fo:static-content display-align="after" flow-name="ChapterFirstPage-after"><fo:block text-align-last="justify" margin-top="6pt" font-family="Times New Roman" font-size="9pt" font-style="italic"><fo:leader/><fo:inline font-size="9pt" font-style="italic"><fo:page-number/></fo:inline><fo:leader/></fo:block></fo:static-content><fo:static-content display-align="before" flow-name="ChapterEvenPage-before"><fo:block text-align-last="justify" font-family="Times New Roman" font-size="9pt" font-style="italic"><fo:inline font-size="9pt" font-style="italic"><fo:page-number/></fo:inline><fo:leader/><fo:inline font-size="9pt" font-style="italic"><fo:retrieve-marker retrieve-class-name="chap-title"/></fo:inline></fo:block></fo:static-content><fo:static-content display-align="before" flow-name="ChapterOddPage-before"><fo:block text-align-last="justify" font-family="Times New Roman" font-size="9pt" font-style="italic"><fo:inline font-size="9pt" font-style="italic"><fo:retrieve-marker retrieve-class-name="section-title"/></fo:inline><fo:leader/><fo:inline font-size="9pt" font-style="italic"><fo:page-number/></fo:inline></fo:block></fo:static-content><fo:static-content flow-name="xsl-footnote-separator"><fo:block text-align="left"><fo:leader leader-pattern="rule" leader-length="2in"/></fo:block></fo:static-content><fo:flow flow-name="xsl-region-body" font-family="Arial" font-size="12pt"><fo:marker marker-class-name="chap-title">References</fo:marker><fo:block id="rXLingPapReferences" span="all" break-before="odd-page" font-size="18pt" font-weight="bold" space-before="176pt" space-before.conditionality="retain" space-after="10.8pt" text-align="center">References</fo:block><fo:block line-height="1.2"><fo:block text-indent="-.25in" 
start-indent=".25in" id="rAlcantara2008a" font-size="10pt"><fo:inline>Alcantara, Danniel, and Allan Borra.  </fo:inline><fo:inline>2008a.  </fo:inline><fo:inline>“Constituent structure for Filipino: Induction through probabilistic approaches.”  </fo:inline><fo:inline>Proceedings of the 22nd Pacific Asia Conference on Language, Information and Computation (PACLIC22).  </fo:inline><fo:inline>Cebu, Philippines.</fo:inline></fo:block><fo:block text-indent="-.25in" start-indent=".25in" id="rSapir" font-size="10pt"><fo:inline>Sapir, Edward.  </fo:inline><fo:inline>1921.  </fo:inline><fo:inline font-style="italic">Language: an introduction to the study of speech.  </fo:inline><fo:inline>New York: </fo:inline><fo:inline>Harcourt Brace &amp; Company.</fo:inline></fo:block></fo:block></fo:flow></fo:page-sequence></fo:root>
