<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	xmlns:georss="http://www.georss.org/georss" xmlns:geo="http://www.w3.org/2003/01/geo/wgs84_pos#" xmlns:media="http://search.yahoo.com/mrss/"
	>

<channel>
	<title>Kais Dukes - Blog</title>
	<atom:link href="http://kaisdukes.wordpress.com/feed/" rel="self" type="application/rss+xml" />
	<link>http://kaisdukes.wordpress.com</link>
	<description>Financial Software Engineering and Scientific Research</description>
	<lastBuildDate>Wed, 02 Nov 2011 19:27:38 +0000</lastBuildDate>
	<language>en</language>
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
	<generator>http://wordpress.com/</generator>
<cloud domain='kaisdukes.wordpress.com' port='80' path='/?rsscloud=notify' registerProcedure='' protocol='http-post' />
<image>
		<url>http://1.gravatar.com/blavatar/f60d99f2416dba7bacfb4349de3f3cec?s=96&#038;d=http%3A%2F%2Fs2.wp.com%2Fi%2Fbuttonw-com.png</url>
		<title>Kais Dukes - Blog</title>
		<link>http://kaisdukes.wordpress.com</link>
	</image>
	<atom:link rel="search" type="application/opensearchdescription+xml" href="http://kaisdukes.wordpress.com/osd.xml" title="Kais Dukes - Blog" />
	<atom:link rel='hub' href='http://kaisdukes.wordpress.com/?pushpress=hub'/>
		<item>
		<title>Maryam&#8217;s First Words</title>
		<link>http://kaisdukes.wordpress.com/2011/11/02/maryams-first-words/</link>
		<comments>http://kaisdukes.wordpress.com/2011/11/02/maryams-first-words/#comments</comments>
		<pubDate>Wed, 02 Nov 2011 19:27:34 +0000</pubDate>
		<dc:creator>kaisdukes</dc:creator>
				<category><![CDATA[Maryam]]></category>
		<category><![CDATA[Baby]]></category>
		<category><![CDATA[Crawling]]></category>
		<category><![CDATA[First Words]]></category>

		<guid isPermaLink="false">http://kaisdukes.wordpress.com/?p=506</guid>
		<description><![CDATA[Maryam is now just over 6 months old. We have been letting her play a lot on the floor under our supervision, and she has started to crawl in the last few weeks. Also, on Sunday and again today, Maryam said her first word &#8220;Baba&#8221;. This is a bit different to Khalid who said the [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=kaisdukes.wordpress.com&amp;blog=12997370&amp;post=506&amp;subd=kaisdukes&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Maryam is now just over 6 months old. We have been letting her play a lot on the floor under our supervision, and she has started to crawl in the last few weeks. Also, on Sunday and again today, Maryam said her first word &#8220;Baba&#8221;. This is a bit different to Khalid who said the same first word (which means &#8220;Daddy&#8221;, in Arabic) earlier at 4 months. He only started to crawl later at 8 months.</p>
<p><a href="http://kaisdukes.files.wordpress.com/2011/11/maryam_nov2012_p2.jpg"><img class="alignnone size-full wp-image-507" title="Maryam_Nov2012_p2" src="http://kaisdukes.files.wordpress.com/2011/11/maryam_nov2012_p2.jpg?w=380&#038;h=281" alt="" width="380" height="281" /></a></p>
<p>Maryam is very cute, very healthy, and has grown very big and tall compared to when she was first born. She laughs and smiles a lot, especially when happy after eating, and also when playing with her big brother Khalid, who is now 2 years and 3 months old.</p>
<p><a href="http://kaisdukes.files.wordpress.com/2011/11/maryam_nov2012_p1.jpg"><img class="alignnone size-full wp-image-508" title="Maryam_Nov2012_p1" src="http://kaisdukes.files.wordpress.com/2011/11/maryam_nov2012_p1.jpg?w=380&#038;h=285" alt="" width="380" height="285" /></a></p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/kaisdukes.wordpress.com/506/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/kaisdukes.wordpress.com/506/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/kaisdukes.wordpress.com/506/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/kaisdukes.wordpress.com/506/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/kaisdukes.wordpress.com/506/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/kaisdukes.wordpress.com/506/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/kaisdukes.wordpress.com/506/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/kaisdukes.wordpress.com/506/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/kaisdukes.wordpress.com/506/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/kaisdukes.wordpress.com/506/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/kaisdukes.wordpress.com/506/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/kaisdukes.wordpress.com/506/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/kaisdukes.wordpress.com/506/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/kaisdukes.wordpress.com/506/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=kaisdukes.wordpress.com&amp;blog=12997370&amp;post=506&amp;subd=kaisdukes&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://kaisdukes.wordpress.com/2011/11/02/maryams-first-words/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/3c8e1cc0b54e6f96239ab19177fc92ad?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">kaisdukes</media:title>
		</media:content>

		<media:content url="http://kaisdukes.files.wordpress.com/2011/11/maryam_nov2012_p2.jpg" medium="image">
			<media:title type="html">Maryam_Nov2012_p2</media:title>
		</media:content>

		<media:content url="http://kaisdukes.files.wordpress.com/2011/11/maryam_nov2012_p1.jpg" medium="image">
			<media:title type="html">Maryam_Nov2012_p1</media:title>
		</media:content>
	</item>
		<item>
		<title>IWPT 2011 at Dublin City University</title>
		<link>http://kaisdukes.wordpress.com/2011/10/05/iwpt-2011-at-dublin-city-university/</link>
		<comments>http://kaisdukes.wordpress.com/2011/10/05/iwpt-2011-at-dublin-city-university/#comments</comments>
		<pubDate>Wed, 05 Oct 2011 21:56:00 +0000</pubDate>
		<dc:creator>kaisdukes</dc:creator>
				<category><![CDATA[PhD]]></category>
		<category><![CDATA[Quranic Arabic Corpus]]></category>
		<category><![CDATA[Writing]]></category>
		<category><![CDATA[IWPT]]></category>
		<category><![CDATA[parsing]]></category>

		<guid isPermaLink="false">http://kaisdukes.wordpress.com/?p=482</guid>
		<description><![CDATA[Today I presented a paper (co-authored with Nizar Habash) on statistical parsing at the IWPT 2011 conference. A three day event at Dublin City University, this was a great opportunity to meet some leading names in the fields of Computational Linguistics and Natural Language Parsing, and to discuss ideas for further research work and future [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=kaisdukes.wordpress.com&amp;blog=12997370&amp;post=482&amp;subd=kaisdukes&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Today I presented a <a href="http://www.kaisdukes.com/papers/qparse-iwpt2011.pdf">paper</a> (co-authored with <a href="http://www.nizarhabash.com/">Nizar Habash</a>) on statistical parsing at the <a href="http://www.dcu.ie/conferences/iwpt/">IWPT 2011 conference</a>. A three day event at <a href="http://www.dcu.ie/index.shtml">Dublin City University</a>, this was a great opportunity to meet some leading names in the fields of Computational Linguistics and Natural Language Parsing, and to discuss ideas for further research work and future collaboration.</p>
<p>Due to family commitments, I was only able to attend the first day of the conference to present my talk, and so I missed out on the full three day event. However, it was still a great experience.</p>
<p><strong>Presentation</strong></p>
<p>The paper I presented, <a href="http://www.kaisdukes.com/papers/qparse-iwpt2011.pdf">One-Step Statistical Parsing of Hybrid Dependency-Constituency Syntactic Representations</a>, was received well, judging by the feedback and response I got after the talk. I managed to get across the key points of the research in the presentation: The linguistic context for why the Quranic Treebank uses a hybrid syntactic representation, the rich morphological features annotated in the treebank, and the challenges this gives rise to for statistical parsing. I mentioned that although there could be many ways to solve the hybrid parsing problem, we focused on <em>transition-based</em> shift-reduce parsing, as opposed to a graph-based parsing algorithm. In other words, more like <a href="http://maltparser.org/">MaltParser</a> as opposed to <a href="http://www.seas.upenn.edu/~strctlrn/MSTParser/MSTParser.html">MSTParser</a>.</p>
<p>At the end of the talk, I had time to answer a few questions.</p>
<p><a href="http://kaisdukes.files.wordpress.com/2011/10/helix-dcu.jpeg"><img class="alignnone size-full wp-image-488" title="helix-dcu" src="http://kaisdukes.files.wordpress.com/2011/10/helix-dcu.jpeg?w=380&#038;h=285" alt="" width="380" height="285" /></a></p>
<p>In the first question, <a href="http://stp.ling.uu.se/~nivre/">Joakim Nivre</a> wanted some further clarification on exactly what the input to the parser was. Although the presentation described the input as gold-standard morphologically tagged text with segmentation, I did not make clear during the talk if empty categories were assumed in the input, or if these were generated by the parser. This was a fair point by Joakim. The paper does cover this in more detail &#8211; the parser handles elision directly and this is not assumed in the input. We take only the original source text, segmented and annotated with morphological features.</p>
<p>The second question by <a href="http://www.dfki.de/~feiyu/">Feiyu Xu</a> related to how the parser produced phrase structure. In particular, how it was possible to produce complete subgraphs under a phrase or clause. The assumption, I explained, was that at a certain point in its operation, the parser would learn to recognize the head of a sub-graph that should be raised to a phrase from the top of the stack. Of course, not all phrases could be formed this way, but given the strong accuracy of the parser for hybrid phrase structure reported in the paper, this would appear to be a reasonable assumption.</p>
<p>In the last question, <a href="http://homepages.inf.ed.ac.uk/steedman/">Mark Steedman</a> wanted to know more about the traditional Arabic grammar used as the linguistic framework for annotating the <a href="http://corpus.quran.com">Quranic Arabic Treebank</a>. In particular, the question was under what conditions the grammar would treat a chunk as a phrase and give it a phrase label as opposed to using only dependency structure. My answer was that, as far as I could tell from having been through numerous examples from the grammatical gold-standard reference texts, phrases appear to be made explicit in the grammar when a chunk can stand alone, independent of the rest of the sentence, such as an embedded sentence or subordinate clause.</p>
<p><strong>Opportunities for Future Work and Collaboration</strong></p>
<p>I met a lot of interesting and smart people at the conference, too many to list all here by name. Overall, I received two pieces of common feedback when discussing my parsing research. The first was that the hybrid representation was interesting and appealing as a research idea given that not much work has been done in this area, and that there is definitely merit in combining the best of both representations into a single treebank. Secondly, a lot of the feedback I received centred around the next logical step in the research, which would be to integrate morphological analysis into the parser. This would allow the parser to run against raw text instead of using gold-standard morphological input. Different people had different ideas about how this could be done, but nearly everyone agreed it was an important next step.</p>
<p>I also learnt that although some recent initial work has been done on integrating POS-tagging and transition dependency parsing for Chinese, there does not appear to be any work on joint morphological analysis for <em>transition</em> dependency parsing in any language. <a href="http://people.ict.usc.edu/~sagae/">Kenji Sagae</a> confirmed my own hunch that for a full integrated transition approach some form of non-deterministic parsing would be necessary, in order to explore the joint disambiguation search space. He pointed me to his <a href="http://www.isi.edu/~lhuang/dp-final.pdf">2010 ACL paper</a> on introducing dynamic programming into shift-reduce parsing. He suggested that I might want to get in touch with <a href="http://www-tsujii.is.s.u-tokyo.ac.jp/~matuzaki/atlab.html">Takuya Matsuzaki</a> (also at IWPT 2011) whose <a href="http://www-tsujii.is.s.u-tokyo.ac.jp/~hatori/papers/ijcnlp2011-joint.pdf">2011 IJCNLP</a> paper uses the same algorithm as Kenji’s to perform joint POS-tagging and syntactic dependency parsing for Chinese. Interestingly, Nizar had pointed out a related <a href="http://aclweb.org/anthology-new/D/D11/D11-1109.pdf">2011 EMNLP</a> paper to me back in July, also on joint tagging for Chinese, but with a focus on graph algorithms instead of transition parsing &#8211; another good paper.</p>
<p><a href="http://kaisdukes.files.wordpress.com/2011/10/parsing.png"><img class="alignnone size-full wp-image-491" title="parsing" src="http://kaisdukes.files.wordpress.com/2011/10/parsing.png?w=380&#038;h=306" alt="" width="380" height="306" /></a></p>
<p>I later met with <a href="http://staff.science.uva.nl/~simaan/">Khalil Sima&#8217;an</a> who it turns out can speak Arabic as well as Hebrew. Interestingly, Khalil was <a href="http://stp.ling.uu.se/~tsarfaty/">Reut Tsarfaty</a>’s co-supervisor during her PhD thesis on joint morphological and syntactic analysis for Hebrew. Khalil also knows <a href="http://www.engineering.leeds.ac.uk/people/computing/staff/e.s.atwell">Eric Atwell</a>, my PhD supervisor at the University of Leeds. He advised that research into joint morphological and syntactic analysis for Arabic was something definitely needed.</p>
<p>Finally, I ended the day with a follow-up discussion with <a href="http://stp.ling.uu.se/~nivre/">Joakim Nivre</a> after the main conference talks had ended. Joakim was open to the idea of collaborating on future research, especially if this involved doing further work on transition-based parsing. Some ideas could include revisiting his work on hybrid parsing for Swedish and German. He seemed impressed with my presentation and the paper, and especially liked the strong empirical results &#8211; achieving around 90% accuracy (near state-of-the-art) for dependency parsing. Confirming the other feedback I had received today, he thought that joint morphological and syntactic analysis would be the way to go for further research into parsing Classical Arabic. He also liked the way in which the basic <a href="http://maltparser.org/">MaltParser</a> algorithm had been extended using additional parser actions to handle hybrid parsing – apparently something he had wanted to do himself for some time.</p>
<p>We also talked briefly about different possible ways to add non-determinism to the parser, as a step towards joint morphological disambiguation. Dynamic programming could be one way, but Joakim suggested that even experimenting with vanilla beam search would be a good first step.</p>
<p><strong>Conclusion</strong></p>
<p>All-in-all a great day. I met some very intelligent people, experts in their respective fields, and also got to listen to some very interesting and relevant talks. A shame I could only stay for the first day instead of the full three day conference, but I do have a lot else going on right now with work and family. I would definitely like to pursue some of the ideas discussed today for further collaboration. Hybrid parsing was of interest to the conference delegates given that it is a bit different and not often studied. I also heard from nearly everyone I spoke to that joint morphological disambiguation and syntactic parsing would be a very interesting next step. From what I could tell, the state-of-the-art in this particular research area for transition-based parsing was to include only POS tagging as a joint task. Joakim suggested that including morphological analysis directly into a transition-based parser would be new research, but something that other researchers might soon also be looking at as well.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/kaisdukes.wordpress.com/482/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/kaisdukes.wordpress.com/482/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/kaisdukes.wordpress.com/482/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/kaisdukes.wordpress.com/482/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/kaisdukes.wordpress.com/482/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/kaisdukes.wordpress.com/482/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/kaisdukes.wordpress.com/482/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/kaisdukes.wordpress.com/482/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/kaisdukes.wordpress.com/482/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/kaisdukes.wordpress.com/482/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/kaisdukes.wordpress.com/482/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/kaisdukes.wordpress.com/482/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/kaisdukes.wordpress.com/482/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/kaisdukes.wordpress.com/482/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=kaisdukes.wordpress.com&amp;blog=12997370&amp;post=482&amp;subd=kaisdukes&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://kaisdukes.wordpress.com/2011/10/05/iwpt-2011-at-dublin-city-university/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/3c8e1cc0b54e6f96239ab19177fc92ad?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">kaisdukes</media:title>
		</media:content>

		<media:content url="http://kaisdukes.files.wordpress.com/2011/10/helix-dcu.jpeg" medium="image">
			<media:title type="html">helix-dcu</media:title>
		</media:content>

		<media:content url="http://kaisdukes.files.wordpress.com/2011/10/parsing.png" medium="image">
			<media:title type="html">parsing</media:title>
		</media:content>
	</item>
		<item>
		<title>International Conference on Parsing Technologies</title>
		<link>http://kaisdukes.wordpress.com/2011/08/31/international-conference-on-parsing-technologies/</link>
		<comments>http://kaisdukes.wordpress.com/2011/08/31/international-conference-on-parsing-technologies/#comments</comments>
		<pubDate>Wed, 31 Aug 2011 15:09:55 +0000</pubDate>
		<dc:creator>kaisdukes</dc:creator>
				<category><![CDATA[PhD]]></category>
		<category><![CDATA[Writing]]></category>
		<category><![CDATA[IWPT]]></category>
		<category><![CDATA[parsing]]></category>

		<guid isPermaLink="false">http://kaisdukes.wordpress.com/?p=453</guid>
		<description><![CDATA[I&#8217;m very pleased that my joint paper on statistical parsing co-authored with Dr Nizar Habash, has been accepted at the 12th International Conference on Parsing Technologies. The conference is being held in Dublin, Ireland from the 5th to the 7th of October. Entry into this year&#8217;s conference was very competitive, so I should really thank [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=kaisdukes.wordpress.com&amp;blog=12997370&amp;post=453&amp;subd=kaisdukes&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>I&#8217;m very pleased that my joint paper on statistical parsing co-authored with <a href="http://www.nizarhabash.com">Dr Nizar Habash</a>, has been accepted at the <a href="http://www.dcu.ie/conferences/iwpt">12th International Conference on Parsing Technologies</a>. The conference is being held in Dublin, Ireland from the 5th to the 7th of October. Entry into this year&#8217;s conference was very competitive, so I should really thank Nizar for pushing me to work on a high-quality paper, and also my supervisor at the <a href="http://www.engineering.leeds.ac.uk/computing/research/institute-artificial-intelligence-biological-systems.shtml">Institute of Artificial Intelligence</a>, <a href="http://www.comp.leeds.ac.uk/eric">Dr Eric Atwell</a>, for encouraging me to pursue research into statistical parsing of the rich Arabic language of the Quran. I&#8217;m very pleased to have been accepted at this particular conference, given the high quality research into natural language parsing presented at the conference in recent years.</p>
<p><strong>One-step Statistical Parsing of Hybrid Dependency-Constituency Syntactic Representations.</strong></p>
<p>In a nutshell, the paper builds on techniques from <a href="http://en.wikipedia.org/wiki/Machine_learning">Machine Learning</a> and <a href="http://en.wikipedia.org/wiki/Artificial_intelligence">Artificial Intelligence</a> (specifically, <a href="http://en.wikipedia.org/wiki/Support_vector_machine">Support Vector Machines</a>), and describes a new algorithm ideally suited to parsing the <a href="http://corpus.quran.com/documentation/dependencygraph.jsp">complex linguistic structures</a> found in traditional grammatical analysis of the Quran.</p>
<p>The current draft of the paper is available <a href="http://www.kaisdukes.com/papers/qparse-iwpt2011.pdf">here</a>.</p>
<p><a href="http://kaisdukes.files.wordpress.com/2011/08/redneuronal.jpg"><img class="alignnone size-full wp-image-454" title="RedNeuronal" src="http://kaisdukes.files.wordpress.com/2011/08/redneuronal.jpg?w=380&#038;h=285" alt="" width="380" height="285" /></a></p>
<p>As well as being excited that my recent research is getting published, I&#8217;m also happy that my writing ability is improving. Before starting my PhD in 2009, the last time I had written anything substantial was around 15 years ago while doing GCSE English. My A-levels and University degrees were all numerical with plenty of equations. It’s only relatively recently that I&#8217;ve had to describe my research through prose and present this as a consistent story. In my <a href="http://www.kaisdukes.com/publications.html">first few papers</a>, I found this really hard. But recently, I’ve gotten into the swing of things. This really shows in the recent feedback from the three anonymous reviewers of the IWPT paper:</p>
<blockquote><p>The paper is well written and the structure of the paper flows well.</p></blockquote>
<blockquote><p>I like this paper.</p></blockquote>
<blockquote><p>The paper is well structured and it presents substantial amount of research.</p></blockquote>
<p>Overall, the paper was given a score of 4 out of 5. This latest publication will really help towards the research material that I need for the final PhD thesis. Looks like I&#8217;ll be taking Imen and the kids to Dublin City University in October!</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/kaisdukes.wordpress.com/453/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/kaisdukes.wordpress.com/453/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/kaisdukes.wordpress.com/453/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/kaisdukes.wordpress.com/453/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/kaisdukes.wordpress.com/453/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/kaisdukes.wordpress.com/453/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/kaisdukes.wordpress.com/453/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/kaisdukes.wordpress.com/453/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/kaisdukes.wordpress.com/453/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/kaisdukes.wordpress.com/453/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/kaisdukes.wordpress.com/453/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/kaisdukes.wordpress.com/453/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/kaisdukes.wordpress.com/453/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/kaisdukes.wordpress.com/453/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=kaisdukes.wordpress.com&amp;blog=12997370&amp;post=453&amp;subd=kaisdukes&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://kaisdukes.wordpress.com/2011/08/31/international-conference-on-parsing-technologies/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/3c8e1cc0b54e6f96239ab19177fc92ad?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">kaisdukes</media:title>
		</media:content>

		<media:content url="http://kaisdukes.files.wordpress.com/2011/08/redneuronal.jpg" medium="image">
			<media:title type="html">RedNeuronal</media:title>
		</media:content>
	</item>
		<item>
		<title>July</title>
		<link>http://kaisdukes.wordpress.com/2011/07/11/july/</link>
		<comments>http://kaisdukes.wordpress.com/2011/07/11/july/#comments</comments>
		<pubDate>Mon, 11 Jul 2011 07:51:20 +0000</pubDate>
		<dc:creator>kaisdukes</dc:creator>
				<category><![CDATA[Khalid]]></category>
		<category><![CDATA[Maryam]]></category>
		<category><![CDATA[Learning]]></category>
		<category><![CDATA[Painting]]></category>
		<category><![CDATA[Speaking]]></category>
		<category><![CDATA[Talking]]></category>

		<guid isPermaLink="false">http://kaisdukes.wordpress.com/?p=442</guid>
		<description><![CDATA[We&#8217;re not even half way through July and it&#8217;s already been a very busy month. Maryam has grown so fast. She&#8217;s only 11 weeks old, but looking strong and healthy. She loves feeding on milk, and smiles a lot especially when given attention. Khalid has been very busy as well. The last few weeks have [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=kaisdukes.wordpress.com&amp;blog=12997370&amp;post=442&amp;subd=kaisdukes&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>We&#8217;re not even half way through July and it&#8217;s already been a very busy month. Maryam has grown so fast. She&#8217;s only 11 weeks old, but looking strong and healthy. She loves feeding on milk, and smiles a lot especially when given attention.</p>
<p><a href="http://kaisdukes.files.wordpress.com/2011/07/maryam-11weeks.jpg"><img class="alignnone size-full wp-image-443" title="maryam-11weeks" src="http://kaisdukes.files.wordpress.com/2011/07/maryam-11weeks.jpg?w=380&#038;h=506" alt="" width="380" height="506" /></a></p>
<p>Khalid has been very busy as well. The last few weeks have seen a big leap in his ability to put together simple two and three word sentences. At the moment his favourites are &#8216;read a book&#8217; and &#8216;let&#8217;s go out&#8217;, for when he wants to be read a bedtime story and for when he wants to go out to the park.</p>
<p>Khalid has also painted his first picture using paints and a brush, which Imen and I both think looks pretty impressive. He is going to be two years old in August, next month.</p>
<p><a href="http://kaisdukes.files.wordpress.com/2011/07/khalid-painting.jpeg"><img class="alignnone size-full wp-image-444" title="khalid-painting" src="http://kaisdukes.files.wordpress.com/2011/07/khalid-painting.jpeg?w=380&#038;h=396" alt="" width="380" height="396" /></a></p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/kaisdukes.wordpress.com/442/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/kaisdukes.wordpress.com/442/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/kaisdukes.wordpress.com/442/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/kaisdukes.wordpress.com/442/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/kaisdukes.wordpress.com/442/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/kaisdukes.wordpress.com/442/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/kaisdukes.wordpress.com/442/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/kaisdukes.wordpress.com/442/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/kaisdukes.wordpress.com/442/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/kaisdukes.wordpress.com/442/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/kaisdukes.wordpress.com/442/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/kaisdukes.wordpress.com/442/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/kaisdukes.wordpress.com/442/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/kaisdukes.wordpress.com/442/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=kaisdukes.wordpress.com&amp;blog=12997370&amp;post=442&amp;subd=kaisdukes&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://kaisdukes.wordpress.com/2011/07/11/july/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/3c8e1cc0b54e6f96239ab19177fc92ad?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">kaisdukes</media:title>
		</media:content>

		<media:content url="http://kaisdukes.files.wordpress.com/2011/07/maryam-11weeks.jpg" medium="image">
			<media:title type="html">maryam-11weeks</media:title>
		</media:content>

		<media:content url="http://kaisdukes.files.wordpress.com/2011/07/khalid-painting.jpeg" medium="image">
			<media:title type="html">khalid-painting</media:title>
		</media:content>
	</item>
		<item>
		<title>Khalid and Maryam</title>
		<link>http://kaisdukes.wordpress.com/2011/05/23/khalid-and-maryam/</link>
		<comments>http://kaisdukes.wordpress.com/2011/05/23/khalid-and-maryam/#comments</comments>
		<pubDate>Mon, 23 May 2011 06:59:44 +0000</pubDate>
		<dc:creator>kaisdukes</dc:creator>
				<category><![CDATA[Khalid]]></category>
		<category><![CDATA[Maryam]]></category>
		<category><![CDATA[Chickens]]></category>
		<category><![CDATA[Children]]></category>
		<category><![CDATA[Newborn]]></category>
		<category><![CDATA[Stepney City Farm]]></category>

		<guid isPermaLink="false">http://kaisdukes.wordpress.com/?p=431</guid>
		<description><![CDATA[Taken on the 4th of May 2011, here is Khalid looking at Maryam when she was only 12 days old: Here&#8217;s another picture of Maryam when she was a bit older &#8211; this time at 2-weeks old. As is normal for newborns, she was a lot more responsive and alert by this age, compared to [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=kaisdukes.wordpress.com&amp;blog=12997370&amp;post=431&amp;subd=kaisdukes&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Taken on the 4th of May 2011, here is Khalid looking at Maryam when she was only 12 days old:</p>
<p><a href="http://kaisdukes.files.wordpress.com/2011/05/may4th.jpg"><img class="alignnone size-full wp-image-432" title="May4th" src="http://kaisdukes.files.wordpress.com/2011/05/may4th.jpg?w=380&#038;h=506" alt="" width="380" height="506" /></a></p>
<p>Here&#8217;s another picture of Maryam when she was a bit older &#8211; this time at 2-weeks old. As is normal for newborns, she was a lot more responsive and alert by this age, compared to the first days after being born:</p>
<p><a href="http://kaisdukes.files.wordpress.com/2011/05/may8th.jpg"><img class="alignnone size-full wp-image-433" title="May8th" src="http://kaisdukes.files.wordpress.com/2011/05/may8th.jpg?w=380&#038;h=506" alt="" width="380" height="506" /></a></p>
<p>This weekend Khalid had a nice time chasing chickens! We are very fortunate to be living only a couple of minutes away from <a href="http://www.stepneycityfarm.org">Stepney City Farm</a>:</p>
<p><a href="http://kaisdukes.files.wordpress.com/2011/05/may21st.jpg"><img class="alignnone size-full wp-image-434" title="May21st" src="http://kaisdukes.files.wordpress.com/2011/05/may21st.jpg?w=380&#038;h=506" alt="" width="380" height="506" /></a></p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/kaisdukes.wordpress.com/431/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/kaisdukes.wordpress.com/431/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/kaisdukes.wordpress.com/431/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/kaisdukes.wordpress.com/431/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/kaisdukes.wordpress.com/431/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/kaisdukes.wordpress.com/431/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/kaisdukes.wordpress.com/431/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/kaisdukes.wordpress.com/431/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/kaisdukes.wordpress.com/431/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/kaisdukes.wordpress.com/431/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/kaisdukes.wordpress.com/431/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/kaisdukes.wordpress.com/431/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/kaisdukes.wordpress.com/431/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/kaisdukes.wordpress.com/431/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=kaisdukes.wordpress.com&amp;blog=12997370&amp;post=431&amp;subd=kaisdukes&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://kaisdukes.wordpress.com/2011/05/23/khalid-and-maryam/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/3c8e1cc0b54e6f96239ab19177fc92ad?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">kaisdukes</media:title>
		</media:content>

		<media:content url="http://kaisdukes.files.wordpress.com/2011/05/may4th.jpg" medium="image">
			<media:title type="html">May4th</media:title>
		</media:content>

		<media:content url="http://kaisdukes.files.wordpress.com/2011/05/may8th.jpg" medium="image">
			<media:title type="html">May8th</media:title>
		</media:content>

		<media:content url="http://kaisdukes.files.wordpress.com/2011/05/may21st.jpg" medium="image">
			<media:title type="html">May21st</media:title>
		</media:content>
	</item>
		<item>
		<title>Parsing the Quran using Support Vector Machines</title>
		<link>http://kaisdukes.wordpress.com/2011/05/21/parsing-the-quran-using-support-vector-machines/</link>
		<comments>http://kaisdukes.wordpress.com/2011/05/21/parsing-the-quran-using-support-vector-machines/#comments</comments>
		<pubDate>Sat, 21 May 2011 10:07:38 +0000</pubDate>
		<dc:creator>kaisdukes</dc:creator>
				<category><![CDATA[PhD]]></category>
		<category><![CDATA[Quranic Arabic Corpus]]></category>
		<category><![CDATA[Writing]]></category>
		<category><![CDATA[AI]]></category>
		<category><![CDATA[parsing]]></category>
		<category><![CDATA[quran]]></category>
		<category><![CDATA[Support Vector Machines]]></category>

		<guid isPermaLink="false">http://kaisdukes.wordpress.com/?p=424</guid>
		<description><![CDATA[I&#8217;ve been working hard the last few days on PhD research. I&#8217;ve submitted for Eric&#8216;s review a suggested plan for our joint submission to Arabica. The current working title is Detailed Grammatical Analysis of the Quran using Artificial Intelligence. At the same time, I&#8217;ve also been running some machine learning experiments for parsing the latest version [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=kaisdukes.wordpress.com&amp;blog=12997370&amp;post=424&amp;subd=kaisdukes&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>I&#8217;ve been working hard the last few days on PhD research. I&#8217;ve submitted for <a href="http://www.comp.leeds.ac.uk/eric">Eric</a>&#8216;s review a suggested plan for our joint submission to <a href="http://www.brill.nl/arab">Arabica</a>. The current working title is <em>Detailed Grammatical Analysis of the Quran using Artificial Intelligence</em>. At the same time, I&#8217;ve also been running some machine learning experiments for parsing the latest version of the <a href="http://corpus.quran.com/treebank.jsp">Quranic Arabic Dependency Treebank</a>, for a separate paper. The good news is that I&#8217;ve finally managed to figure out how to use SVMs to parse the treebank, with an F-measure accuracy score of around 90%! This should lead to a stronger submission for <a href="https://sites.google.com/site/spmrl2011/">SPMRL 2011</a>.</p>
<p><a href="http://kaisdukes.files.wordpress.com/2011/05/svm.png"><img class="alignnone size-full wp-image-425" title="svm" src="http://kaisdukes.files.wordpress.com/2011/05/svm.png?w=380&#038;h=294" alt="" width="380" height="294" /></a></p>
<p>Previously, I was working with a C4.5 decision tree classifier, which although competitive, had a slightly lower accuracy score. To get SVMs working, I closely followed <a href="http://www.aclweb.org/anthology/W/W08/W08-1007.pdf">Hall and Nivre’s approach</a> to parsing German:</p>
<blockquote><p>All symbolic features were converted to numerical features and we use the quadratic kernel of the LIBSVM package (Chang and Lin, 2001) for mapping histories to parser actions and arc labels. All results are based on the following settings of LIBSVM: gamma = 0.2 and r = 0 for the kernel parameters, C = 0.5 for the penalty parameter, and epsilon = 1.0 for the termination criterion. We also split the training instances into smaller sets according to the fine-grained part-of-speech of the next input token to train separate one-versus-one multi-class LIBSVM-classifiers.</p></blockquote>
<p>Not using <a href="http://www.cs.waikato.ac.nz/ml/weka/">Weka</a> and instead going direct to <a href="http://www.csie.ntu.edu.tw/~cjlin/libsvm/">LIBSVM</a> has helped a bit with training time. But the three main things I needed to do to get this working were (1) using the right kernel parameters as above, (2) binarization of features, and crucially (3) training multiple classifiers, one for each part-of-speech of the next input token &#8211; essential for reducing training time considerably.</p>
<p>Running a complete end-to-end test takes around only two minutes. This includes training on 90% of the data, and then testing against an unseen 10% of the data to work out the F-measure score. I&#8217;m very happy having finally got this working. SVMs are way cool!</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/kaisdukes.wordpress.com/424/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/kaisdukes.wordpress.com/424/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/kaisdukes.wordpress.com/424/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/kaisdukes.wordpress.com/424/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/kaisdukes.wordpress.com/424/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/kaisdukes.wordpress.com/424/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/kaisdukes.wordpress.com/424/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/kaisdukes.wordpress.com/424/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/kaisdukes.wordpress.com/424/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/kaisdukes.wordpress.com/424/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/kaisdukes.wordpress.com/424/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/kaisdukes.wordpress.com/424/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/kaisdukes.wordpress.com/424/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/kaisdukes.wordpress.com/424/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=kaisdukes.wordpress.com&amp;blog=12997370&amp;post=424&amp;subd=kaisdukes&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://kaisdukes.wordpress.com/2011/05/21/parsing-the-quran-using-support-vector-machines/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/3c8e1cc0b54e6f96239ab19177fc92ad?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">kaisdukes</media:title>
		</media:content>

		<media:content url="http://kaisdukes.files.wordpress.com/2011/05/svm.png" medium="image">
			<media:title type="html">svm</media:title>
		</media:content>
	</item>
		<item>
		<title>Statistical Parsing of Morphologically Rich Languages (SPMRL 2011)</title>
		<link>http://kaisdukes.wordpress.com/2011/05/12/statistical-parsing-of-morphologically-rich-languages-spmrl-2011/</link>
		<comments>http://kaisdukes.wordpress.com/2011/05/12/statistical-parsing-of-morphologically-rich-languages-spmrl-2011/#comments</comments>
		<pubDate>Thu, 12 May 2011 07:21:37 +0000</pubDate>
		<dc:creator>kaisdukes</dc:creator>
				<category><![CDATA[PhD]]></category>
		<category><![CDATA[Quranic Arabic Corpus]]></category>
		<category><![CDATA[Writing]]></category>
		<category><![CDATA[Conference]]></category>
		<category><![CDATA[IWPT]]></category>
		<category><![CDATA[parsing]]></category>
		<category><![CDATA[Publication]]></category>
		<category><![CDATA[Research]]></category>
		<category><![CDATA[SPMRL]]></category>

		<guid isPermaLink="false">http://kaisdukes.wordpress.com/?p=420</guid>
		<description><![CDATA[I’ve got a couple of packed months ahead with regards to research. This is a good thing, as having this research going through peer-review and being accepted for publication can only increase the chances of being awarded a doctorate for the final thesis. As well as working on a submission for the Arabica Journal (co-authored [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=kaisdukes.wordpress.com&amp;blog=12997370&amp;post=420&amp;subd=kaisdukes&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>I’ve got a couple of packed months ahead with regards to research. This is a good thing, as having this research going through peer-review and being accepted for publication can only increase the chances of being awarded a doctorate for the final thesis. As well as working on a submission for the <a href="http://www.brill.nl/arabica">Arabica Journal</a> (co-authored with PhD supervisor <a href="http://www.comp.leeds.ac.uk/eric">Eric Atwell</a>), I’m also working on a separate submission with another collaborator for SPMRL 2011.</p>
<p><a href="http://kaisdukes.files.wordpress.com/2011/05/oconnell-bridge.jpg"><img class="alignnone size-full wp-image-421" title="oconnell-bridge" src="http://kaisdukes.files.wordpress.com/2011/05/oconnell-bridge.jpg?w=380&#038;h=143" alt="" width="380" height="143" /></a></p>
<p>For <a href="https://sites.google.com/site/spmrl2011">SPMRL</a> it is possible to also dual submit to the main <a href="http://www.dcu.ie/conferences/iwpt/index.shtml">IWPT</a> conference. The deadline for this is the 18th of July, with the conference and workshop being held at Dublin City University.</p>
<p><strong>Workshop Important Dates (SPMRL)</strong></p>
<p>Submission deadline: July 31st, 2011</p>
<p>Notification to authors: September 5th, 2011</p>
<p>Camera ready copy: September 20th, 2011</p>
<p>Workshop: October 6th, 2011</p>
<p>From the workshop’s FAQ: <em>Can I submit the same paper to IWPT and SPMRL?</em> Yes, double submissions are permitted but obviously the same paper will not be published at both venues. Another possibility for those working on parsing MRLs is submit two different papers: in this scenario, we encourage authors to view the SPMRL workshop as a venue for more detailed analysis papers.</p>
<p><strong>Main Conference Important Dates (IWPT)</strong></p>
<p>Deadline for paper submission: July 18th, 2011</p>
<p>Notification of acceptance: August 29th, 2011</p>
<p>Final papers due: September 12th, 2011</p>
<p>Conference: October 5th-7th, 2011</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/kaisdukes.wordpress.com/420/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/kaisdukes.wordpress.com/420/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/kaisdukes.wordpress.com/420/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/kaisdukes.wordpress.com/420/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/kaisdukes.wordpress.com/420/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/kaisdukes.wordpress.com/420/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/kaisdukes.wordpress.com/420/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/kaisdukes.wordpress.com/420/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/kaisdukes.wordpress.com/420/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/kaisdukes.wordpress.com/420/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/kaisdukes.wordpress.com/420/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/kaisdukes.wordpress.com/420/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/kaisdukes.wordpress.com/420/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/kaisdukes.wordpress.com/420/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=kaisdukes.wordpress.com&amp;blog=12997370&amp;post=420&amp;subd=kaisdukes&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://kaisdukes.wordpress.com/2011/05/12/statistical-parsing-of-morphologically-rich-languages-spmrl-2011/feed/</wfw:commentRss>
		<slash:comments>1</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/3c8e1cc0b54e6f96239ab19177fc92ad?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">kaisdukes</media:title>
		</media:content>

		<media:content url="http://kaisdukes.files.wordpress.com/2011/05/oconnell-bridge.jpg" medium="image">
			<media:title type="html">oconnell-bridge</media:title>
		</media:content>
	</item>
		<item>
		<title>Detailed Morphological and Syntactic Analysis of the Quran in the Framework of Traditional Arabic Linguistics</title>
		<link>http://kaisdukes.wordpress.com/2011/05/12/detailed-morphological-and-syntactic-analysis-of-the-quran-in-the-framework-of-traditional-arabic-linguistics/</link>
		<comments>http://kaisdukes.wordpress.com/2011/05/12/detailed-morphological-and-syntactic-analysis-of-the-quran-in-the-framework-of-traditional-arabic-linguistics/#comments</comments>
		<pubDate>Thu, 12 May 2011 07:14:11 +0000</pubDate>
		<dc:creator>kaisdukes</dc:creator>
				<category><![CDATA[PhD]]></category>
		<category><![CDATA[Quranic Arabic Corpus]]></category>
		<category><![CDATA[Writing]]></category>
		<category><![CDATA[Arabic Linguistics]]></category>
		<category><![CDATA[Journal]]></category>
		<category><![CDATA[quran]]></category>

		<guid isPermaLink="false">http://kaisdukes.wordpress.com/?p=413</guid>
		<description><![CDATA[I recently submitted an abstract to Brill&#8217;s Arabica Journal. Eric has kindly agreed to be a co-author on this paper, and his advice and guidance on this will be very valuable. Sébastien Garnier from the journal replied to us to let us know that such a paper would  fall within the scope of the Journal&#8217;s [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=kaisdukes.wordpress.com&amp;blog=12997370&amp;post=413&amp;subd=kaisdukes&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>I recently submitted an abstract to Brill&#8217;s <a href="http://www.brill.nl/arabica">Arabica Journal</a>. Eric has kindly agreed to be a co-author on this paper, and his advice and guidance on this will be very valuable. Sébastien Garnier from the journal replied to us to let us know that such a paper would  fall within the scope of the Journal&#8217;s publication, but that we must submit the full paper for formal peer-review. Sounds promising. Now we need to write the full paper! Here is the abstract we sent to Arabica:</p>
<p><strong>Abstract</strong></p>
<p>The Quranic Arabic Corpus is a recently annotated linguistic resource used to study the Quran through the historical grammar for Classical Arabic known as <em>i&#8217;rāb</em> (Dukes, Atwell and Sharaf, 2010). The website (<a href="http://corpus.quran.com">http://corpus.quran.com</a>) is used by Arabic linguists and Quranic students, and provides detailed morphological and syntactic analysis for each word in the Quran. This grammatical information was originally generated by an Artificial Intelligence (AI) computer program, by applying techniques from corpus linguistics to ‘learn’ how to recognize reoccurring patterns in Arabic text. To ensure a high level of accuracy, the website has been proofread by volunteers, who compare the automatic analysis against traditional sources of Quranic grammar through online collaboration (Dukes, Atwell and Habash, 2011). This paper is organized into two parts. In the first part, we describe this new annotated resource and its online interface, and illustrate how its features are used to study the Arabic language of the Quran. In the second part of the paper, we consider a further linguistic application of the resource and its use as a comprehensive grammar of Quranic Arabic. We discuss grammatical analysis for several representative examples from the Quran.</p>
<p>In part one, we describe the Quranic Arabic Corpus and its associated website. This annotated linguistic resource shows the Arabic grammar, syntax and morphology for each word in the Quran. The corpus provides three levels of analysis: morphological annotation, a syntactic treebank and a semantic ontology. Most other Quranic websites include the Arabic text of the Quran, English translations and possibly audio recitation. The Quranic Arabic Corpus goes beyond this, by applying annotation techniques from modern corpus linguistics. The website provides detailed part-of-speech and morphological tagging, syntactic dependencies, a word-by-word interlinear translation into English, a hyperlinked concordance and a morphological dictionary organized by Arabic root and lemma. In addition, a comment-based system allows online visitors to discuss the resource in detail, and to suggest corrections online. This feedback mechanism allows corrections to be reviewed and integrated back into the dataset over time, resulting in a highly accurate annotated resource. This has grown from a small research project into a significant worldwide study site for Arabic, now used by 100,000 visitors each month including academic researchers, Quranic scholars and students of Arabic, who have found the Quranic Arabic Corpus useful (Dukes et al., 2010).</p>
<p>In part two, we provide further linguistic details, and discuss how dependency graphs are used to annotate grammatical relationships between words. This provides a novel way to visually understand the syntactic structure of Quranic Arabic. These graphs are collected into a treebank that models linguistic dependencies such as verb and subject (<em>fi&#8217;il wa fa&#8217;il</em>) and subject and predicate (<em>mubtada wa khabar</em>). Similar dependency treebanks have been developed for English (Cinková et al., 2009), Chinese (Liu et al., 2006) and more recently for Modern Standard Arabic (Habash and Roth, 2009). However, using the notation of dependency syntax presents a special set of challenges when applied to <em>i&#8217;rāb</em>. This paper addresses the question of how well modern dependency graphs can be used to represent traditional analyses, and we consider the differences between these two approaches. Central to this, is the relationship between the concepts of <em>amal and amil</em> from <em>i&#8217;rāb</em> (action and actor), and the modern notion of heads and dependents. We show that by extending standard dependency grammar to include hidden nodes, it is possible to support the key technique from <em>i&#8217;rāb</em> known as <em>hadhf wa taqdeer</em> (elision and reconstruction).  In addition, to fully account for the classical treatment of conjunction and preposition phrases, it is necessary to go beyond the syntactic representation used in most other treebanks, by introducing phrase nodes into dependency graphs.</p>
<p>We present a new linguistic resource for the Quran, and the first treebank for Quranic Arabic. We also present a novel contribution to Arabic grammatical theory, by investigating the assumed linguistic dependency framework that underlies <em>i&#8217;rāb</em>, and by modeling this using formal structures that correspond to other recent treebanking efforts for Modern Standard Arabic (MSA).</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/kaisdukes.wordpress.com/413/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/kaisdukes.wordpress.com/413/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/kaisdukes.wordpress.com/413/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/kaisdukes.wordpress.com/413/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/kaisdukes.wordpress.com/413/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/kaisdukes.wordpress.com/413/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/kaisdukes.wordpress.com/413/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/kaisdukes.wordpress.com/413/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/kaisdukes.wordpress.com/413/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/kaisdukes.wordpress.com/413/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/kaisdukes.wordpress.com/413/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/kaisdukes.wordpress.com/413/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/kaisdukes.wordpress.com/413/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/kaisdukes.wordpress.com/413/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=kaisdukes.wordpress.com&amp;blog=12997370&amp;post=413&amp;subd=kaisdukes&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://kaisdukes.wordpress.com/2011/05/12/detailed-morphological-and-syntactic-analysis-of-the-quran-in-the-framework-of-traditional-arabic-linguistics/feed/</wfw:commentRss>
		<slash:comments>1</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/3c8e1cc0b54e6f96239ab19177fc92ad?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">kaisdukes</media:title>
		</media:content>
	</item>
		<item>
		<title>Annotation Plan for Version 0.5 of the Quranic Arabic Corpus</title>
		<link>http://kaisdukes.wordpress.com/2011/05/02/annotation-plan-for-version-0-5-of-the-quranic-arabic-corpus/</link>
		<comments>http://kaisdukes.wordpress.com/2011/05/02/annotation-plan-for-version-0-5-of-the-quranic-arabic-corpus/#comments</comments>
		<pubDate>Mon, 02 May 2011 17:32:34 +0000</pubDate>
		<dc:creator>kaisdukes</dc:creator>
				<category><![CDATA[PhD]]></category>
		<category><![CDATA[Quranic Arabic Corpus]]></category>

		<guid isPermaLink="false">http://kaisdukes.wordpress.com/?p=410</guid>
		<description><![CDATA[In version 0.5 of the Quranic Arabic Corpus, it is planned to extend the Quranic Arabic Dependency Treebank to include chapters 9-10 and 50-58. The following annotation plan divides this work into 36 blocks of roughly 200 words each: Block #1: (9:1-12) &#8211; 214 words Block #2: (9:13-24) &#8211; 217 words Block #3: (9:25-34) &#8211; [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=kaisdukes.wordpress.com&amp;blog=12997370&amp;post=410&amp;subd=kaisdukes&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>In version 0.5 of the Quranic Arabic Corpus, it is planned to extend the <a href="http://corpus.quran.com/treebank.jsp">Quranic Arabic Dependency Treebank</a> to include chapters 9-10 and 50-58. The following annotation plan divides this work into 36 blocks of roughly 200 words each:</p>
<p>Block #1: (9:1-12) &#8211; 214 words<br />
Block #2: (9:13-24) &#8211; 217 words<br />
Block #3: (9:25-34) &#8211; 212 words<br />
Block #4: (9:35-42) &#8211; 211 words<br />
Block #5: (9:43-55) &#8211; 207 words<br />
Block #6: (9:56-68) &#8211; 213 words<br />
Block #7: (9:69-78) &#8211; 210 words<br />
Block #8: (9:79-90) &#8211; 212 words<br />
Block #9: (9:91-100) &#8211; 214 words<br />
Block #10: (9:101-111) &#8211; 225 words<br />
Block #11: (9:112-120) &#8211; 211 words<br />
Block #12: (9:121-129) &#8211; 152 words<br />
Block #13: (10:1-12) &#8211; 220 words<br />
Block #14: (10:13-22) &#8211; 223 words<br />
Block #15: (10:23-32) &#8211; 204 words<br />
Block #16: (10:33-45) &#8211; 209 words<br />
Block #17: (10:46-60) &#8211; 208 words<br />
Block #18: (10:61-71) &#8211; 201 words<br />
Block #19: (10:72-87) &#8211; 211 words<br />
Block #20: (10:88-109) &#8211; 357 words<br />
Block #21: (50:1-26) &#8211; 209 words<br />
Block #22: (50:27-45) &#8211; 164 words<br />
Block #23: (51:1-39) &#8211; 204 words<br />
Block #24: (51:40-60) &#8211; 156 words<br />
Block #25: (52:1-49) &#8211; 312 words<br />
Block #26: (53:1-31) &#8211; 206 words<br />
Block #27: (53:32-62) &#8211; 154 words<br />
Block #28: (54:1-55) &#8211; 342 words<br />
Block #29: (55:1-78) &#8211; 351 words<br />
Block #30: (56:1-57) &#8211; 200 words<br />
Block #31: (56:58-96) &#8211; 179 words<br />
Block #32: (57:1-12) &#8211; 203 words<br />
Block #33: (57:13-22) &#8211; 220 words<br />
Block #34: (57:23-29) &#8211; 151 words<br />
Block #35: (58:1-8) &#8211; 206 words<br />
Block #36: (58:9-22) &#8211; 266 words</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/kaisdukes.wordpress.com/410/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/kaisdukes.wordpress.com/410/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/kaisdukes.wordpress.com/410/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/kaisdukes.wordpress.com/410/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/kaisdukes.wordpress.com/410/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/kaisdukes.wordpress.com/410/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/kaisdukes.wordpress.com/410/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/kaisdukes.wordpress.com/410/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/kaisdukes.wordpress.com/410/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/kaisdukes.wordpress.com/410/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/kaisdukes.wordpress.com/410/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/kaisdukes.wordpress.com/410/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/kaisdukes.wordpress.com/410/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/kaisdukes.wordpress.com/410/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=kaisdukes.wordpress.com&amp;blog=12997370&amp;post=410&amp;subd=kaisdukes&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://kaisdukes.wordpress.com/2011/05/02/annotation-plan-for-version-0-5-of-the-quranic-arabic-corpus/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/3c8e1cc0b54e6f96239ab19177fc92ad?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">kaisdukes</media:title>
		</media:content>
	</item>
		<item>
		<title>New Version 0.4 of the Quranic Arabic Corpus</title>
		<link>http://kaisdukes.wordpress.com/2011/05/02/new-version-0-4-of-the-quranic-arabic-corpus/</link>
		<comments>http://kaisdukes.wordpress.com/2011/05/02/new-version-0-4-of-the-quranic-arabic-corpus/#comments</comments>
		<pubDate>Mon, 02 May 2011 09:21:14 +0000</pubDate>
		<dc:creator>kaisdukes</dc:creator>
				<category><![CDATA[PhD]]></category>
		<category><![CDATA[Quranic Arabic Corpus]]></category>

		<guid isPermaLink="false">http://kaisdukes.wordpress.com/?p=406</guid>
		<description><![CDATA[Version 0.4 of the Quranic Arabic Corpus was released on the 1st May, 2011. Here are the release notes from the website: The Quranic Arabic Corpus (http://corpus.quran.com) is an international collaborative linguistic project initiated at the University of Leeds, that aims to bridge the gap between the traditional Arabic grammar of i&#8217;rab and techniques from [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=kaisdukes.wordpress.com&amp;blog=12997370&amp;post=406&amp;subd=kaisdukes&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Version 0.4 of the Quranic Arabic Corpus was released on the 1st May, 2011. Here are the release notes from the website:</p>
<p>The Quranic Arabic Corpus (http://corpus.quran.com) is an international collaborative linguistic project initiated at the University of Leeds, that aims to bridge the gap between the traditional Arabic grammar of i&#8217;rab and techniques from modern computational linguistics. This open source resource includes part-of-speech tagging for the Quran, morphological segmentation and a formal representation of Quranic syntax using dependency graphs. Version 0.4 of the corpus provides several improvements over the previous release:</p>
<p>*** [Increased coverage for the syntactic treebank]. Version 0.4 of the treebank covers 40% of the Quran by word count (30,895 out of 77,429 words). The treebank provides syntactic annotation using dependency grammar for chapters 1-8 and 59-114 of the Quran.</p>
<p>*** [Revised morphological analysis]. Following online collaboration by volunteer annotators, over 500 suggestions have been cross-checked against traditional sources of Arabic grammar, resulting in more accurate morphological tagging.</p>
<p>*** [Improved Quran dictionary and lemmatization]. The list of roots and lemmas that group related derived words has been made more consistent with traditional Arabic lexicons. The online Quran dictionary now also includes concordance lines from Quranic verses as context.</p>
<p>*** [Readability and navigation improvements]. The content of the website has been better organized, with improvements to navigation and layout. Several typing mistakes and omissions have been corrected in the word by word interlinear translation into English.</p>
<p>*** [More accurate tagging of proper nouns]. Eight new named entities have been added to the semantic ontology that were previously tagged only as nouns: Al-Ahqaf, Al-Jahiliyah, Al-Jumu&#8217;ah, Baal, Magians, Salsabil, Sirius, and Zaqqum.</p>
<p>*** [More accurate tagging for particles waw and fa]. In accordance with traditional Arabic grammar, for certain words, the particle fa is now tagged as a supplemental particle (harf za&#8217;id), such as in the combination a-fa-man.</p>
<p>*** [Version 0.4 of the morphologically annotated corpus] is freely available for download from the Quranic Arabic Corpus website.</p>
<p>The Quranic Arabic Corpus is an open source project. Contributions or questions about the research are more than welcome. Please direct any correspondence to Kais Dukes, PhD researcher at the School of Computing, University of Leeds:</p>
<p>web: www.kaisdukes.com<br />
e-mail: sckd@leeds.ac.uk</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/kaisdukes.wordpress.com/406/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/kaisdukes.wordpress.com/406/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/kaisdukes.wordpress.com/406/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/kaisdukes.wordpress.com/406/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/kaisdukes.wordpress.com/406/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/kaisdukes.wordpress.com/406/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/kaisdukes.wordpress.com/406/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/kaisdukes.wordpress.com/406/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/kaisdukes.wordpress.com/406/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/kaisdukes.wordpress.com/406/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/kaisdukes.wordpress.com/406/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/kaisdukes.wordpress.com/406/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/kaisdukes.wordpress.com/406/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/kaisdukes.wordpress.com/406/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=kaisdukes.wordpress.com&amp;blog=12997370&amp;post=406&amp;subd=kaisdukes&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://kaisdukes.wordpress.com/2011/05/02/new-version-0-4-of-the-quranic-arabic-corpus/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/3c8e1cc0b54e6f96239ab19177fc92ad?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">kaisdukes</media:title>
		</media:content>
	</item>
	</channel>
</rss>
