<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet type="text/xsl" media="screen" href="/~d/styles/rss2full.xsl"?><?xml-stylesheet type="text/css" media="screen" href="http://feeds.feedburner.com/~d/styles/itemcontent.css"?><rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:wfw="http://wellformedweb.org/CommentAPI/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:atom="http://www.w3.org/2005/Atom" xmlns:sy="http://purl.org/rss/1.0/modules/syndication/" xmlns:slash="http://purl.org/rss/1.0/modules/slash/" xmlns:feedburner="http://rssnamespace.org/feedburner/ext/1.0" version="2.0">

<channel>
	<title>我爱自然语言处理</title>
	
	<link>http://www.52nlp.cn</link>
	<description>I Love Natural Language Processing</description>
	<lastBuildDate>Wed, 21 Jul 2010 15:33:24 +0000</lastBuildDate>
	<generator>http://wordpress.org/?v=2.9.2</generator>
	<language>en</language>
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
			<atom10:link xmlns:atom10="http://www.w3.org/2005/Atom" rel="self" type="application/rss+xml" href="http://feeds.feedburner.com/52nlp" /><feedburner:info uri="52nlp" /><atom10:link xmlns:atom10="http://www.w3.org/2005/Atom" rel="hub" href="http://pubsubhubbub.appspot.com/" /><feedburner:emailServiceId>52nlp</feedburner:emailServiceId><feedburner:feedburnerHostname>http://feedburner.google.com</feedburner:feedburnerHostname><item>
		<title>机器翻译新闻一则：SDL公司收购Language Weaver</title>
		<link>http://feedproxy.google.com/~r/52nlp/~3/FtPCl299HvQ/%e6%9c%ba%e5%99%a8%e7%bf%bb%e8%af%91%e6%96%b0%e9%97%bb%e4%b8%80%e5%88%99-sdl%e5%85%ac%e5%8f%b8%e6%94%b6%e8%b4%adlanguage-weaver</link>
		<comments>http://www.52nlp.cn/%e6%9c%ba%e5%99%a8%e7%bf%bb%e8%af%91%e6%96%b0%e9%97%bb%e4%b8%80%e5%88%99-sdl%e5%85%ac%e5%8f%b8%e6%94%b6%e8%b4%adlanguage-weaver#comments</comments>
		<pubDate>Wed, 21 Jul 2010 15:27:37 +0000</pubDate>
		<dc:creator>52nlp</dc:creator>
				<category><![CDATA[机器翻译]]></category>
		<category><![CDATA[自然语言处理]]></category>
		<category><![CDATA[Kevin Knight]]></category>
		<category><![CDATA[Language Weaver]]></category>
		<category><![CDATA[SDL]]></category>
		<category><![CDATA[统计机器翻译]]></category>

		<guid isPermaLink="false">http://www.52nlp.cn/?p=3420</guid>
		<description><![CDATA[　　也许是时下流行收购吧，前天刚谈了“Google收购语义网公司Metaweb”，没想到今天又发现“SDL公司收购Language Weaver”。Language Weaver是我非常崇拜的统计机器翻译公司，曾经在这里写过”自然语言处理公司巡礼七：Language Weaver“，没想到也被收购了！以下是上述新闻摘录的要点：
　　英国梅登黑德——作为一家领先的全球信息管理方案提供商，SDL 2010年7月15日宣布已签署收购 Language Weaver Inc.（以下简称“Language Weaver”） 的协议。Language Weaver 是统计机器翻译领域的先驱，对其收购不仅仅是为了将最好的自动翻译技术移植到 SDL 全球信息管理平台中，事实上它的意义远大于此。将安全的机器翻译技术集成到翻译供应链的各个环节中，可使企业和政府能更快更高效地翻译超大容量的内容，以满足当今急剧增长的网络世界对海量信息的需求。经股东同意，此次交易共购买 Language Weaver 85% 以上的资本所有权，预计将于 2010 年 7 月底完成交易。
　　．．．
　　Language Weaver 总部设在美国加利福尼亚州洛杉矶市，在美国、欧洲和日本都有办公室，拥有雇员96 名。公司与南加利福尼亚大学信息科学研究院（机器翻译研究的领军机构）合作紧密。双方科学家都在共同努力，以期进一步研究和提高统计机器翻译方法。Language Weaver 的创始人Daniel Marcu 和 Kevin Knight 均为统计机器翻译领域的领军人物，他们将继续留任公司。因为 Language Weaver 技术的品质与性能已达到全新水平，Mark Tapling新近提拔成为了 Language Weaver 的 CEO， 以便进一步加强公司的商业化进程，Mark Tapling 也将继续留任公司。且当前并无对 Language Weaver 公司进行裁员的计划。
　　．．．
　　 “尽管谷歌翻译已成为消费者即时翻译的标准，但我们发现，大多数企业希望拥有自己的自动翻译技术，”Language Weaver 的董事长兼执行总裁Mark Tapling 说到，“使用Language Weaver，可保证您的内容安全、保密；它遵循翻译工作流程，而且可以很容易地集成到其他系统中。它也可以提供质量排序和受训系统，以提供值得您信赖的质量。它遵守诸如公司品牌和翻译一致性这类要求。Language Weaver的研发团队，不断推进统计机器翻译研究的极限，同时为企业和政府机构提供人际交往解决方案。SDL的收购将大大增强Language Weaver团队解决问题的能力，并向市场推出独特的高价值机器翻译产品和解决方案。”
　　．．．
　　今天，自动翻译仅占翻译市场总量的 1% [...]


相关文章:<ol><li><a href='http://www.52nlp.cn/natural-language-processing-company-language-weaver' rel='bookmark' title='Permanent Link: 自然语言处理公司巡礼七：Language Weaver'>自然语言处理公司巡礼七：Language Weaver</a></li>
<li><a href='http://www.52nlp.cn/%e6%9c%ba%e5%99%a8%e7%bf%bb%e8%af%91%e6%96%b0%e9%97%bb%e4%b8%80%e5%88%99' rel='bookmark' title='Permanent Link: 机器翻译新闻一则'>机器翻译新闻一则</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-and-computational-linguistics-books-summary-five-machine-translation' rel='bookmark' title='Permanent Link: 自然语言处理与计算语言学书籍汇总之五：机器翻译'>自然语言处理与计算语言学书籍汇总之五：机器翻译</a></li>
<li><a href='http://www.52nlp.cn/moses%e6%9c%80%e6%96%b0%e7%89%88%e6%9c%ac%e5%8f%91%e5%b8%83' rel='bookmark' title='Permanent Link: Moses最新版本发布'>Moses最新版本发布</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-company-systran' rel='bookmark' title='Permanent Link: 自然语言处理公司巡礼四：Systran'>自然语言处理公司巡礼四：Systran</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-and-machine-translation-faq' rel='bookmark' title='Permanent Link: 自然语言处理与机器翻译FAQ'>自然语言处理与机器翻译FAQ</a></li>
<li><a href='http://www.52nlp.cn/statistical-machine-translation-tutorial-reading' rel='bookmark' title='Permanent Link: 统计机器翻译文献阅读指南'>统计机器翻译文献阅读指南</a></li>
<li><a href='http://www.52nlp.cn/about-acl-anthology-network' rel='bookmark' title='Permanent Link: ACL Anthology 姊妹篇：ACL Anthology Network'>ACL Anthology 姊妹篇：ACL Anthology Network</a></li>
<li><a href='http://www.52nlp.cn/liu-qun-article-recommended' rel='bookmark' title='Permanent Link: 推荐刘群老师的《计算所与北大往事回顾》'>推荐刘群老师的《计算所与北大往事回顾》</a></li>
<li><a href='http://www.52nlp.cn/mit-nlp-first-lesson-introduction-and-overview-second-part' rel='bookmark' title='Permanent Link: MIT自然语言处理第一讲：简介和概述（第二部分）'>MIT自然语言处理第一讲：简介和概述（第二部分）</a></li>
</ol>]]></description>
			<content:encoded><![CDATA[<p>　　也许是时下流行收购吧，前天刚谈了“<a href="http://www.52nlp.cn/%E8%AF%AD%E4%B9%89%E7%BD%91%E6%96%B0%E9%97%BB%E4%B8%80%E5%88%99-google%E6%94%B6%E8%B4%AD%E8%AF%AD%E4%B9%89%E7%BD%91%E5%85%AC%E5%8F%B8metaweb">Google收购语义网公司Metaweb</a>”，没想到今天又发现“<a href="http://news.dayoo.com/china/201007/20/54502_13347123.htm">SDL公司收购Language Weaver</a>”。Language Weaver是我非常崇拜的统计机器翻译公司，曾经在这里写过”<a href="http://www.52nlp.cn/natural-language-processing-company-language-weaver">自然语言处理公司巡礼七：Language Weaver</a>“，没想到也被收购了！以下是上述新闻摘录的要点：<span id="more-3420"></span></p>
<blockquote><p>　　英国梅登黑德——作为一家领先的全球信息管理方案提供商，SDL 2010年7月15日宣布已签署收购 Language Weaver Inc.（以下简称“Language Weaver”） 的协议。Language Weaver 是统计机器翻译领域的先驱，对其收购不仅仅是为了将最好的自动翻译技术移植到 SDL 全球信息管理平台中，事实上它的意义远大于此。将安全的机器翻译技术集成到翻译供应链的各个环节中，可使企业和政府能更快更高效地翻译超大容量的内容，以满足当今急剧增长的网络世界对海量信息的需求。经股东同意，此次交易共购买 Language Weaver 85% 以上的资本所有权，预计将于 2010 年 7 月底完成交易。<br />
　　．．．<br />
　　Language Weaver 总部设在美国加利福尼亚州洛杉矶市，在美国、欧洲和日本都有办公室，拥有雇员96 名。公司与南加利福尼亚大学信息科学研究院（机器翻译研究的领军机构）合作紧密。双方科学家都在共同努力，以期进一步研究和提高统计机器翻译方法。Language Weaver 的创始人Daniel Marcu 和 Kevin Knight 均为统计机器翻译领域的领军人物，他们将继续留任公司。因为 Language Weaver 技术的品质与性能已达到全新水平，Mark Tapling新近提拔成为了 Language Weaver 的 CEO， 以便进一步加强公司的商业化进程，Mark Tapling 也将继续留任公司。且当前并无对 Language Weaver 公司进行裁员的计划。<br />
　　．．．<br />
　　 “尽管谷歌翻译已成为消费者即时翻译的标准，但我们发现，大多数企业希望拥有自己的自动翻译技术，”Language Weaver 的董事长兼执行总裁Mark Tapling 说到，“使用Language Weaver，可保证您的内容安全、保密；它遵循翻译工作流程，而且可以很容易地集成到其他系统中。它也可以提供质量排序和受训系统，以提供值得您信赖的质量。它遵守诸如公司品牌和翻译一致性这类要求。Language Weaver的研发团队，不断推进统计机器翻译研究的极限，同时为企业和政府机构提供人际交往解决方案。SDL的收购将大大增强Language Weaver团队解决问题的能力，并向市场推出独特的高价值机器翻译产品和解决方案。”<br />
　　．．．<br />
　　今天，自动翻译仅占翻译市场总量的 1% 左右（据IDC提供的数据，约为100-150亿美元）但市场分析人士预计，无论是整个翻译市场，还是自动翻译的市场份额都将持续大幅度增长。SDL发现自动翻译能降低客户 30％ 到50％ 的翻译成本，与此同时，已翻译内容的市场投放时间可缩短 50% 以上。</p></blockquote>
<p>注：转载请注明出处“<a href="http://www.52nlp.cn">我爱自然语言处理</a>”：<a href="http://www.52nlp.cn">www.52nlp.cn</a></p>
<p>本文链接地址：<a href="http://www.52nlp.cn/机器翻译新闻一则-sdl公司收购language-weaver">http://www.52nlp.cn/机器翻译新闻一则-sdl公司收购language-weaver</a></p>
<p>
<!-- Begin Google Adsense code -->
<script type="text/javascript"><!--
google_ad_client = "pub-4332174469367599";
/* 336x280, 创建于 09-2-7 */
google_ad_slot = "5707022987";
google_ad_width = 336;
google_ad_height = 280;
//-->
</script>
<script type="text/javascript"
src="http://pagead2.googlesyndication.com/pagead/show_ads.js">
</script>
<!-- End Google Adsense code -->
   </p>


<p>相关文章:<ol><li><a href='http://www.52nlp.cn/natural-language-processing-company-language-weaver' rel='bookmark' title='Permanent Link: 自然语言处理公司巡礼七：Language Weaver'>自然语言处理公司巡礼七：Language Weaver</a></li>
<li><a href='http://www.52nlp.cn/%e6%9c%ba%e5%99%a8%e7%bf%bb%e8%af%91%e6%96%b0%e9%97%bb%e4%b8%80%e5%88%99' rel='bookmark' title='Permanent Link: 机器翻译新闻一则'>机器翻译新闻一则</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-and-computational-linguistics-books-summary-five-machine-translation' rel='bookmark' title='Permanent Link: 自然语言处理与计算语言学书籍汇总之五：机器翻译'>自然语言处理与计算语言学书籍汇总之五：机器翻译</a></li>
<li><a href='http://www.52nlp.cn/moses%e6%9c%80%e6%96%b0%e7%89%88%e6%9c%ac%e5%8f%91%e5%b8%83' rel='bookmark' title='Permanent Link: Moses最新版本发布'>Moses最新版本发布</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-company-systran' rel='bookmark' title='Permanent Link: 自然语言处理公司巡礼四：Systran'>自然语言处理公司巡礼四：Systran</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-and-machine-translation-faq' rel='bookmark' title='Permanent Link: 自然语言处理与机器翻译FAQ'>自然语言处理与机器翻译FAQ</a></li>
<li><a href='http://www.52nlp.cn/statistical-machine-translation-tutorial-reading' rel='bookmark' title='Permanent Link: 统计机器翻译文献阅读指南'>统计机器翻译文献阅读指南</a></li>
<li><a href='http://www.52nlp.cn/about-acl-anthology-network' rel='bookmark' title='Permanent Link: ACL Anthology 姊妹篇：ACL Anthology Network'>ACL Anthology 姊妹篇：ACL Anthology Network</a></li>
<li><a href='http://www.52nlp.cn/liu-qun-article-recommended' rel='bookmark' title='Permanent Link: 推荐刘群老师的《计算所与北大往事回顾》'>推荐刘群老师的《计算所与北大往事回顾》</a></li>
<li><a href='http://www.52nlp.cn/mit-nlp-first-lesson-introduction-and-overview-second-part' rel='bookmark' title='Permanent Link: MIT自然语言处理第一讲：简介和概述（第二部分）'>MIT自然语言处理第一讲：简介和概述（第二部分）</a></li>
</ol></p><img src="http://feeds.feedburner.com/~r/52nlp/~4/FtPCl299HvQ" height="1" width="1"/>]]></content:encoded>
			<wfw:commentRss>http://www.52nlp.cn/%e6%9c%ba%e5%99%a8%e7%bf%bb%e8%af%91%e6%96%b0%e9%97%bb%e4%b8%80%e5%88%99-sdl%e5%85%ac%e5%8f%b8%e6%94%b6%e8%b4%adlanguage-weaver/feed</wfw:commentRss>
		<slash:comments>2</slash:comments>
		<feedburner:origLink>http://www.52nlp.cn/%e6%9c%ba%e5%99%a8%e7%bf%bb%e8%af%91%e6%96%b0%e9%97%bb%e4%b8%80%e5%88%99-sdl%e5%85%ac%e5%8f%b8%e6%94%b6%e8%b4%adlanguage-weaver</feedburner:origLink></item>
		<item>
		<title>语义网新闻一则：Google收购语义网公司Metaweb</title>
		<link>http://feedproxy.google.com/~r/52nlp/~3/yvs-m6Gz9J4/%e8%af%ad%e4%b9%89%e7%bd%91%e6%96%b0%e9%97%bb%e4%b8%80%e5%88%99-google%e6%94%b6%e8%b4%ad%e8%af%ad%e4%b9%89%e7%bd%91%e5%85%ac%e5%8f%b8metaweb</link>
		<comments>http://www.52nlp.cn/%e8%af%ad%e4%b9%89%e7%bd%91%e6%96%b0%e9%97%bb%e4%b8%80%e5%88%99-google%e6%94%b6%e8%b4%ad%e8%af%ad%e4%b9%89%e7%bd%91%e5%85%ac%e5%8f%b8metaweb#comments</comments>
		<pubDate>Mon, 19 Jul 2010 13:36:36 +0000</pubDate>
		<dc:creator>52nlp</dc:creator>
				<category><![CDATA[自然语言处理]]></category>
		<category><![CDATA[语义网]]></category>
		<category><![CDATA[Google]]></category>
		<category><![CDATA[Metaweb]]></category>
		<category><![CDATA[W3CHINA]]></category>

		<guid isPermaLink="false">http://www.52nlp.cn/?p=3415</guid>
		<description><![CDATA[　　这几天比较重磅的消息是“Google收购语义网公司Metaweb”，关于Metaweb，这里曾在《自然语言处理公司巡礼六：Metaweb》中介绍过：Metaweb是从事语义网（Semantic Web）技术开发的风险企业，目标是开发用于Web的语义数据存储的基础结构，是曾就职于原美国网景（Netscape）、英特尔以及 AlexaInternet等公司的人才聚集在一起，于2005年7月成立，总部设在美国旧金山。
Google产品管理主管杰克·门泽尔(Jack Menzel)发表博客文章称，该公司可以处理许多搜索请求，但Metaweb的信息可以使其处理更多搜索请求，“通过推出搜索答案等功能，我们才刚刚开始将我们对互联网的理解用于改进搜索体验”，但对于部分搜索仍然无能为力，“例如，‘美国西海岸地区学费低于3万美元的大学’或‘年龄超过40岁且获得过至少一次奥斯卡奖的演员’，这些问题都很难回答。我们之所以收购Metaweb，是因为我们相信，整合Metaweb的技术将使我们能提供更好的答案”。
　　关于此次收购，国内语义网方面知名的W3CHINA（中国万维网联盟）论坛上专门开贴讨论，其中W3China站长的评论尤为精彩：
去年三月，谷歌三位重量级搜索技术专家Alon Halevy、Peter Norvig和Fernando Pereira曾共同撰文《The Unreasonable Effectiveness of Data》（发表于IEEE Intelligent System）低估语义技术的功效，引来一阵拍砖。
当时就有人声称“谷歌不搞语义”，其实在一家商业公司里，存在走不同甚至相反路线的阵营也是很正常的事。
85公里在地球上并算不上多长的路，但这段路如果被铺设在白令海峡上，那么它将贯通美洲大陆和亚欧大陆。
　　有兴趣的读者可以关注原帖：Google购买语义网公司Metaweb，迈向语义网技术领域重要一步
注：转载请注明出处“我爱自然语言处理”：www.52nlp.cn
本文链接地址：http://www.52nlp.cn/语义网新闻一则-google收购语义网公司metaweb







   


相关文章:Beautiful Data-统计语言模型的应用一：缘起
自然语言处理公司巡礼六：Metaweb
自然语言处理公司巡礼四：Systran
机器翻译新闻一则：SDL公司收购Language Weaver
CWB中文词库试用及其他
Beautiful Data-统计语言模型的应用三：分词5
Beautiful Data-统计语言模型的应用二：背景
自然语言处理及计算语言学常见缩略语
自动作文评分与自然语言处理
ACL Anthology 姊妹篇：ACL Anthology Network



相关文章:<ol><li><a href='http://www.52nlp.cn/beautiful-data-%e7%bb%9f%e8%ae%a1%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e7%9a%84%e5%ba%94%e7%94%a8%e4%b8%80%e7%bc%98%e8%b5%b7' rel='bookmark' title='Permanent Link: Beautiful Data-统计语言模型的应用一：缘起'>Beautiful Data-统计语言模型的应用一：缘起</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-company-metaweb' rel='bookmark' title='Permanent Link: 自然语言处理公司巡礼六：Metaweb'>自然语言处理公司巡礼六：Metaweb</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-company-systran' rel='bookmark' title='Permanent Link: 自然语言处理公司巡礼四：Systran'>自然语言处理公司巡礼四：Systran</a></li>
<li><a href='http://www.52nlp.cn/%e6%9c%ba%e5%99%a8%e7%bf%bb%e8%af%91%e6%96%b0%e9%97%bb%e4%b8%80%e5%88%99-sdl%e5%85%ac%e5%8f%b8%e6%94%b6%e8%b4%adlanguage-weaver' rel='bookmark' title='Permanent Link: 机器翻译新闻一则：SDL公司收购Language Weaver'>机器翻译新闻一则：SDL公司收购Language Weaver</a></li>
<li><a href='http://www.52nlp.cn/cwb-trial-and-others' rel='bookmark' title='Permanent Link: CWB中文词库试用及其他'>CWB中文词库试用及其他</a></li>
<li><a href='http://www.52nlp.cn/beautiful-data-%e7%bb%9f%e8%ae%a1%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e7%9a%84%e5%ba%94%e7%94%a8%e4%b8%89%e5%88%86%e8%af%8d5' rel='bookmark' title='Permanent Link: Beautiful Data-统计语言模型的应用三：分词5'>Beautiful Data-统计语言模型的应用三：分词5</a></li>
<li><a href='http://www.52nlp.cn/beautiful-data-%e7%bb%9f%e8%ae%a1%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e7%9a%84%e5%ba%94%e7%94%a8%e4%ba%8c%e8%83%8c%e6%99%af' rel='bookmark' title='Permanent Link: Beautiful Data-统计语言模型的应用二：背景'>Beautiful Data-统计语言模型的应用二：背景</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-and-computational-linguistics-common-abbreviations-acronyms' rel='bookmark' title='Permanent Link: 自然语言处理及计算语言学常见缩略语'>自然语言处理及计算语言学常见缩略语</a></li>
<li><a href='http://www.52nlp.cn/automated-essay-scoring-and-natural-language-processing' rel='bookmark' title='Permanent Link: 自动作文评分与自然语言处理'>自动作文评分与自然语言处理</a></li>
<li><a href='http://www.52nlp.cn/about-acl-anthology-network' rel='bookmark' title='Permanent Link: ACL Anthology 姊妹篇：ACL Anthology Network'>ACL Anthology 姊妹篇：ACL Anthology Network</a></li>
</ol>]]></description>
			<content:encoded><![CDATA[<p>　　这几天比较重磅的消息是“<a href="http://www.nytimes.com/external/readwriteweb/2010/07/16/16readwriteweb-google-makes-major-semantic-web-play-acquir-62129.html?emc=eta1"target=_blank>Google收购语义网公司Metaweb</a>”，关于Metaweb，这里曾在《<a href="http://www.52nlp.cn/natural-language-processing-company-metaweb">自然语言处理公司巡礼六：Metaweb</a>》中介绍过：Metaweb是从事语义网（Semantic Web）技术开发的风险企业，目标是开发用于Web的语义数据存储的基础结构，是曾就职于原美国网景（Netscape）、英特尔以及 AlexaInternet等公司的人才聚集在一起，于2005年7月成立，总部设在美国旧金山。<span id="more-3415"></span></p>
<blockquote><p>Google产品管理主管杰克·门泽尔(Jack Menzel)发表博客文章称，该公司可以处理许多搜索请求，但Metaweb的信息可以使其处理更多搜索请求，“通过推出搜索答案等功能，我们才刚刚开始将我们对互联网的理解用于改进搜索体验”，但对于部分搜索仍然无能为力，“例如，‘美国西海岸地区学费低于3万美元的大学’或‘年龄超过40岁且获得过至少一次奥斯卡奖的演员’，这些问题都很难回答。我们之所以收购Metaweb，是因为我们相信，整合Metaweb的技术将使我们能提供更好的答案”。</p></blockquote>
<p>　　关于此次收购，国内语义网方面知名的W3CHINA（中国万维网联盟）论坛上专门开贴讨论，其中W3China站长的评论尤为精彩：</p>
<blockquote><p>去年三月，谷歌三位重量级搜索技术专家Alon Halevy、Peter Norvig和Fernando Pereira曾共同撰文《The Unreasonable Effectiveness of Data》（发表于IEEE Intelligent System）低估语义技术的功效，引来一阵拍砖。</p>
<p>当时就有人声称“谷歌不搞语义”，其实在一家商业公司里，存在走不同甚至相反路线的阵营也是很正常的事。</p>
<p>85公里在地球上并算不上多长的路，但这段路如果被铺设在白令海峡上，那么它将贯通美洲大陆和亚欧大陆。</p></blockquote>
<p>　　有兴趣的读者可以关注原帖：<a href="http://bbs.w3china.org/dispbbs.asp?boardID=2&#038;ID=85780"target=_blank>Google购买语义网公司Metaweb，迈向语义网技术领域重要一步</a></p>
<p>注：转载请注明出处“<a href="http://www.52nlp.cn">我爱自然语言处理</a>”：<a href="http://www.52nlp.cn">www.52nlp.cn</a></p>
<p>本文链接地址：<a href="http://www.52nlp.cn/语义网新闻一则-google收购语义网公司metaweb">http://www.52nlp.cn/语义网新闻一则-google收购语义网公司metaweb</a></p>
<p>
<!-- Begin Google Adsense code -->
<script type="text/javascript"><!--
google_ad_client = "pub-4332174469367599";
/* 336x280, 创建于 09-2-7 */
google_ad_slot = "5707022987";
google_ad_width = 336;
google_ad_height = 280;
//-->
</script>
<script type="text/javascript"
src="http://pagead2.googlesyndication.com/pagead/show_ads.js">
</script>
<!-- End Google Adsense code -->
   </p>


<p>相关文章:<ol><li><a href='http://www.52nlp.cn/beautiful-data-%e7%bb%9f%e8%ae%a1%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e7%9a%84%e5%ba%94%e7%94%a8%e4%b8%80%e7%bc%98%e8%b5%b7' rel='bookmark' title='Permanent Link: Beautiful Data-统计语言模型的应用一：缘起'>Beautiful Data-统计语言模型的应用一：缘起</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-company-metaweb' rel='bookmark' title='Permanent Link: 自然语言处理公司巡礼六：Metaweb'>自然语言处理公司巡礼六：Metaweb</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-company-systran' rel='bookmark' title='Permanent Link: 自然语言处理公司巡礼四：Systran'>自然语言处理公司巡礼四：Systran</a></li>
<li><a href='http://www.52nlp.cn/%e6%9c%ba%e5%99%a8%e7%bf%bb%e8%af%91%e6%96%b0%e9%97%bb%e4%b8%80%e5%88%99-sdl%e5%85%ac%e5%8f%b8%e6%94%b6%e8%b4%adlanguage-weaver' rel='bookmark' title='Permanent Link: 机器翻译新闻一则：SDL公司收购Language Weaver'>机器翻译新闻一则：SDL公司收购Language Weaver</a></li>
<li><a href='http://www.52nlp.cn/cwb-trial-and-others' rel='bookmark' title='Permanent Link: CWB中文词库试用及其他'>CWB中文词库试用及其他</a></li>
<li><a href='http://www.52nlp.cn/beautiful-data-%e7%bb%9f%e8%ae%a1%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e7%9a%84%e5%ba%94%e7%94%a8%e4%b8%89%e5%88%86%e8%af%8d5' rel='bookmark' title='Permanent Link: Beautiful Data-统计语言模型的应用三：分词5'>Beautiful Data-统计语言模型的应用三：分词5</a></li>
<li><a href='http://www.52nlp.cn/beautiful-data-%e7%bb%9f%e8%ae%a1%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e7%9a%84%e5%ba%94%e7%94%a8%e4%ba%8c%e8%83%8c%e6%99%af' rel='bookmark' title='Permanent Link: Beautiful Data-统计语言模型的应用二：背景'>Beautiful Data-统计语言模型的应用二：背景</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-and-computational-linguistics-common-abbreviations-acronyms' rel='bookmark' title='Permanent Link: 自然语言处理及计算语言学常见缩略语'>自然语言处理及计算语言学常见缩略语</a></li>
<li><a href='http://www.52nlp.cn/automated-essay-scoring-and-natural-language-processing' rel='bookmark' title='Permanent Link: 自动作文评分与自然语言处理'>自动作文评分与自然语言处理</a></li>
<li><a href='http://www.52nlp.cn/about-acl-anthology-network' rel='bookmark' title='Permanent Link: ACL Anthology 姊妹篇：ACL Anthology Network'>ACL Anthology 姊妹篇：ACL Anthology Network</a></li>
</ol></p><img src="http://feeds.feedburner.com/~r/52nlp/~4/yvs-m6Gz9J4" height="1" width="1"/>]]></content:encoded>
			<wfw:commentRss>http://www.52nlp.cn/%e8%af%ad%e4%b9%89%e7%bd%91%e6%96%b0%e9%97%bb%e4%b8%80%e5%88%99-google%e6%94%b6%e8%b4%ad%e8%af%ad%e4%b9%89%e7%bd%91%e5%85%ac%e5%8f%b8metaweb/feed</wfw:commentRss>
		<slash:comments>2</slash:comments>
		<feedburner:origLink>http://www.52nlp.cn/%e8%af%ad%e4%b9%89%e7%bd%91%e6%96%b0%e9%97%bb%e4%b8%80%e5%88%99-google%e6%94%b6%e8%b4%ad%e8%af%ad%e4%b9%89%e7%bd%91%e5%85%ac%e5%8f%b8metaweb</feedburner:origLink></item>
		<item>
		<title>天佑安康，天佑父老乡亲！</title>
		<link>http://feedproxy.google.com/~r/52nlp/~3/ExyvQ-nyLzw/%e5%a4%a9%e4%bd%91%e5%ae%89%e5%ba%b7-%e5%a4%a9%e4%bd%91%e7%88%b6%e8%80%81%e4%b9%a1%e4%ba%b2</link>
		<comments>http://www.52nlp.cn/%e5%a4%a9%e4%bd%91%e5%ae%89%e5%ba%b7-%e5%a4%a9%e4%bd%91%e7%88%b6%e8%80%81%e4%b9%a1%e4%ba%b2#comments</comments>
		<pubDate>Sun, 18 Jul 2010 16:05:53 +0000</pubDate>
		<dc:creator>52nlp</dc:creator>
				<category><![CDATA[随笔]]></category>

		<guid isPermaLink="false">http://www.52nlp.cn/?p=3413</guid>
		<description><![CDATA[　　还有一尺，水就要到达家里的二楼了，父亲还在安慰我没事~~虽然从小生活在汉江边，见惯了每年夏天的大小洪水，但是真正的大洪水，我却并没有多少亲历：
　　1983年7月安康遭遇百年不遇的特大洪水，我刚出生三个月，家里的老房子上面还过船，但是我没有任何印记；
　　2005年安康10月大洪水，我在哈尔滨，等父亲告诉我的时候水已退了，那个时候的最大水位就是还有一尺水就要到家里二楼，幸好水没有再涨；
　　前天给家里打电话，父母还告诉我老家没怎么下雨，等今天知道消息时，水已经到家门口了！刚刚给父亲打电话，水平了2005年的记录，不过还在慢慢涨，但是他还在安慰我说没事，让我早点休息！
　　这个时候最应该陪在父母身边的是我，可是自己却远隔千里之外，只能通过一部手机还有这个网络搜寻着任何可能的消息！
　　天佑安康，天佑父老乡亲！挺过今晚，一切都会好的！


相关文章:博客新家，开始新的旅程！
Google&#8217;s Python Class &#8211; SOS
“知行合一”与自然语言处理
“我爱自然语言处理”PageRank再次更新
5.12一周年，愿逝者安息！
单词也疯狂——漂亮的“单词云”
关于计算语言学的一首词
祝大家牛年一帆风顺
赞一下host2ez
Google’s Python Class SOS 续 &#8211;下载



相关文章:<ol><li><a href='http://www.52nlp.cn/new-home-new-start' rel='bookmark' title='Permanent Link: 博客新家，开始新的旅程！'>博客新家，开始新的旅程！</a></li>
<li><a href='http://www.52nlp.cn/googles-python-class-sos' rel='bookmark' title='Permanent Link: Google&#8217;s Python Class &#8211; SOS'>Google&#8217;s Python Class &#8211; SOS</a></li>
<li><a href='http://www.52nlp.cn/the-knowledge-and-action-in-natural-language-processing' rel='bookmark' title='Permanent Link: “知行合一”与自然语言处理'>“知行合一”与自然语言处理</a></li>
<li><a href='http://www.52nlp.cn/52nlp-pagerank-update-second' rel='bookmark' title='Permanent Link: “我爱自然语言处理”PageRank再次更新'>“我爱自然语言处理”PageRank再次更新</a></li>
<li><a href='http://www.52nlp.cn/512%e4%b8%80%e5%91%a8%e5%b9%b4%ef%bc%8c%e6%84%bf%e9%80%9d%e8%80%85%e5%ae%89%e6%81%af%ef%bc%81' rel='bookmark' title='Permanent Link: 5.12一周年，愿逝者安息！'>5.12一周年，愿逝者安息！</a></li>
<li><a href='http://www.52nlp.cn/crazy-word-beautiful-word-clouds' rel='bookmark' title='Permanent Link: 单词也疯狂——漂亮的“单词云”'>单词也疯狂——漂亮的“单词云”</a></li>
<li><a href='http://www.52nlp.cn/a-poem-computational-linguistics' rel='bookmark' title='Permanent Link: 关于计算语言学的一首词'>关于计算语言学的一首词</a></li>
<li><a href='http://www.52nlp.cn/happy-niu-year' rel='bookmark' title='Permanent Link: 祝大家牛年一帆风顺'>祝大家牛年一帆风顺</a></li>
<li><a href='http://www.52nlp.cn/praise-host2ez' rel='bookmark' title='Permanent Link: 赞一下host2ez'>赞一下host2ez</a></li>
<li><a href='http://www.52nlp.cn/googles-python-class-sos-%e7%bb%ad-%e4%b8%8b%e8%bd%bd' rel='bookmark' title='Permanent Link: Google’s Python Class SOS 续 &#8211;下载'>Google’s Python Class SOS 续 &#8211;下载</a></li>
</ol>]]></description>
			<content:encoded><![CDATA[<p>　　还有一尺，水就要到达家里的二楼了，父亲还在安慰我没事~~虽然从小生活在汉江边，见惯了每年夏天的大小洪水，但是真正的大洪水，我却并没有多少亲历：<br />
　　1983年7月安康遭遇百年不遇的特大洪水，我刚出生三个月，家里的老房子上面还过船，但是我没有任何印记；<br />
　　2005年安康10月大洪水，我在哈尔滨，等父亲告诉我的时候水已退了，那个时候的最大水位就是还有一尺水就要到家里二楼，幸好水没有再涨；<br />
　　前天给家里打电话，父母还告诉我老家没怎么下雨，等今天知道消息时，水已经到家门口了！刚刚给父亲打电话，水平了2005年的记录，不过还在慢慢涨，但是他还在安慰我说没事，让我早点休息！<br />
　　这个时候最应该陪在父母身边的是我，可是自己却远隔千里之外，只能通过一部手机还有这个网络搜寻着任何可能的消息！<br />
　　天佑安康，天佑父老乡亲！挺过今晚，一切都会好的！</p>


<p>相关文章:<ol><li><a href='http://www.52nlp.cn/new-home-new-start' rel='bookmark' title='Permanent Link: 博客新家，开始新的旅程！'>博客新家，开始新的旅程！</a></li>
<li><a href='http://www.52nlp.cn/googles-python-class-sos' rel='bookmark' title='Permanent Link: Google&#8217;s Python Class &#8211; SOS'>Google&#8217;s Python Class &#8211; SOS</a></li>
<li><a href='http://www.52nlp.cn/the-knowledge-and-action-in-natural-language-processing' rel='bookmark' title='Permanent Link: “知行合一”与自然语言处理'>“知行合一”与自然语言处理</a></li>
<li><a href='http://www.52nlp.cn/52nlp-pagerank-update-second' rel='bookmark' title='Permanent Link: “我爱自然语言处理”PageRank再次更新'>“我爱自然语言处理”PageRank再次更新</a></li>
<li><a href='http://www.52nlp.cn/512%e4%b8%80%e5%91%a8%e5%b9%b4%ef%bc%8c%e6%84%bf%e9%80%9d%e8%80%85%e5%ae%89%e6%81%af%ef%bc%81' rel='bookmark' title='Permanent Link: 5.12一周年，愿逝者安息！'>5.12一周年，愿逝者安息！</a></li>
<li><a href='http://www.52nlp.cn/crazy-word-beautiful-word-clouds' rel='bookmark' title='Permanent Link: 单词也疯狂——漂亮的“单词云”'>单词也疯狂——漂亮的“单词云”</a></li>
<li><a href='http://www.52nlp.cn/a-poem-computational-linguistics' rel='bookmark' title='Permanent Link: 关于计算语言学的一首词'>关于计算语言学的一首词</a></li>
<li><a href='http://www.52nlp.cn/happy-niu-year' rel='bookmark' title='Permanent Link: 祝大家牛年一帆风顺'>祝大家牛年一帆风顺</a></li>
<li><a href='http://www.52nlp.cn/praise-host2ez' rel='bookmark' title='Permanent Link: 赞一下host2ez'>赞一下host2ez</a></li>
<li><a href='http://www.52nlp.cn/googles-python-class-sos-%e7%bb%ad-%e4%b8%8b%e8%bd%bd' rel='bookmark' title='Permanent Link: Google’s Python Class SOS 续 &#8211;下载'>Google’s Python Class SOS 续 &#8211;下载</a></li>
</ol></p><img src="http://feeds.feedburner.com/~r/52nlp/~4/ExyvQ-nyLzw" height="1" width="1"/>]]></content:encoded>
			<wfw:commentRss>http://www.52nlp.cn/%e5%a4%a9%e4%bd%91%e5%ae%89%e5%ba%b7-%e5%a4%a9%e4%bd%91%e7%88%b6%e8%80%81%e4%b9%a1%e4%ba%b2/feed</wfw:commentRss>
		<slash:comments>8</slash:comments>
		<feedburner:origLink>http://www.52nlp.cn/%e5%a4%a9%e4%bd%91%e5%ae%89%e5%ba%b7-%e5%a4%a9%e4%bd%91%e7%88%b6%e8%80%81%e4%b9%a1%e4%ba%b2</feedburner:origLink></item>
		<item>
		<title>ACL 2010 Best Paper Awards</title>
		<link>http://feedproxy.google.com/~r/52nlp/~3/CixbXgGjhyY/acl-2010-best-paper-awards</link>
		<comments>http://www.52nlp.cn/acl-2010-best-paper-awards#comments</comments>
		<pubDate>Thu, 15 Jul 2010 14:21:19 +0000</pubDate>
		<dc:creator>52nlp</dc:creator>
				<category><![CDATA[自然语言处理]]></category>
		<category><![CDATA[计算语言学]]></category>
		<category><![CDATA[ACL]]></category>
		<category><![CDATA[ACL 2010]]></category>
		<category><![CDATA[Best long paper]]></category>
		<category><![CDATA[Best Paper Awards]]></category>
		<category><![CDATA[Best short paper]]></category>
		<category><![CDATA[IBM Best student paper]]></category>
		<category><![CDATA[Lifetime Achievement Award]]></category>

		<guid isPermaLink="false">http://www.52nlp.cn/?p=3404</guid>
		<description><![CDATA[　　ACL 2010官方主页似乎在前几天已经确定好了本次大会的Best Paper Awards，在其Awards页面里，不仅给出了本次大会的Best long paper, Best short paper, IBM Best student paper，而且包括其在会议期间Presented time. 
Best long paper
Beyond NomBank: A Study of Implicit Arguments for Nominal Predicates
Matthew Gerber and Joyce Chai
Despite its substantial coverage, NomBank does not account for all within-sentence arguments and ignores extrasentential arguments altogether. These arguments, which we call implicit, are important to [...]


相关文章:<ol><li><a href='http://www.52nlp.cn/acl-ijcnlp-2009-best-paper-awards' rel='bookmark' title='Permanent Link: ACL-IJCNLP 2009 Best Paper Awards'>ACL-IJCNLP 2009 Best Paper Awards</a></li>
<li><a href='http://www.52nlp.cn/acl-ijcnlp-2009-running-one' rel='bookmark' title='Permanent Link: ACL-IJCNLP 2009会议进行时一'>ACL-IJCNLP 2009会议进行时一</a></li>
<li><a href='http://www.52nlp.cn/acl-2010%e6%96%87%e7%ab%a0%e5%b7%b2%e5%8f%af%e4%b8%8b%e8%bd%bd' rel='bookmark' title='Permanent Link: ACL 2010文章已可下载'>ACL 2010文章已可下载</a></li>
<li><a href='http://www.52nlp.cn/acl-2010-paper-%e5%9b%bd%e5%86%85%e7%a0%94%e7%a9%b6%e5%8d%95%e4%bd%8d%e5%bd%95%e7%94%a8%e6%83%85%e5%86%b5' rel='bookmark' title='Permanent Link: ACL 2010 Paper国内研究单位录用情况'>ACL 2010 Paper国内研究单位录用情况</a></li>
<li><a href='http://www.52nlp.cn/coling-2010-prospect' rel='bookmark' title='Permanent Link: COLING 2010前瞻——规则与统计共舞，语言随计算齐飞'>COLING 2010前瞻——规则与统计共舞，语言随计算齐飞</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-and-computational-linguistics-books-summary-six-foreign-book' rel='bookmark' title='Permanent Link: 自然语言处理与计算语言学书籍汇总之六：国外书籍'>自然语言处理与计算语言学书籍汇总之六：国外书籍</a></li>
<li><a href='http://www.52nlp.cn/acl-ijcnlp-2009-%e8%af%84%e8%bf%b0%e8%8a%82%e9%80%89' rel='bookmark' title='Permanent Link: ACL-IJCNLP 2009 评述节选'>ACL-IJCNLP 2009 评述节选</a></li>
<li><a href='http://www.52nlp.cn/acl-2010-list-of-accepted-papers' rel='bookmark' title='Permanent Link: ACL 2010: List of Accepted Papers'>ACL 2010: List of Accepted Papers</a></li>
<li><a href='http://www.52nlp.cn/acl-anthology-computational-linguistics-digital-archive' rel='bookmark' title='Permanent Link: ACL Anthology——计算语言学的数字档案'>ACL Anthology——计算语言学的数字档案</a></li>
<li><a href='http://www.52nlp.cn/about-acl-anthology-network' rel='bookmark' title='Permanent Link: ACL Anthology 姊妹篇：ACL Anthology Network'>ACL Anthology 姊妹篇：ACL Anthology Network</a></li>
</ol>]]></description>
			<content:encoded><![CDATA[<p>　　ACL 2010官方主页似乎在前几天已经确定好了本次大会的Best Paper Awards，在其<a href="http://acl2010.org/awards.html"target=_blank>Awards</a>页面里，不仅给出了本次大会的Best long paper, Best short paper, IBM Best student paper，而且包括其在会议期间Presented time. <span id="more-3404"></span></p>
<p><strong>Best long paper</strong><br />
Beyond NomBank: A Study of Implicit Arguments for Nominal Predicates<br />
Matthew Gerber and Joyce Chai</p>
<blockquote><p>Despite its substantial coverage, NomBank does not account for all within-sentence arguments and ignores extrasentential arguments altogether. These arguments, which we call implicit, are important to semantic processing, and their recovery could potentially benefit many NLP applications. We present a study of implicit arguments for a select group of frequent nominal predicates. We show that implicit arguments are pervasive for these predicates, adding 65% to the coverage of NomBank. We demonstrate the feasibility of recovering implicit arguments with a supervised classification model. Our results and analyses provide a baseline for future work on this emerging task.</p></blockquote>
<p><strong>Best short paper</strong><br />
SVD and Clustering for Unsupervised POS Tagging<br />
Michael Lamar, Yariv Maron, Mark Johnson, Elie Bienenstock</p>
<blockquote><p>
We revisit the algorithm of Schütze (1995) for unsupervised part-of-speech tagging. The algorithm uses reduced-rank singular value decomposition followed by clustering to extract latent features from context distributions. As implemented here, it achieves state-of-the-art tagging accuracy at considerably less cost than more recent methods. It can also produce a range of finer-grained taggings, with potential applications to various tasks.</p></blockquote>
<p><strong>IBM Best student paper</strong><br />
Extracting Social Networks from Literary Fiction<br />
David Elson,  Nicholas Dames,  Kathleen McKeown<br />
（注：该文也是一篇long paper，作者是学生）</p>
<blockquote><p>
We present a method for extracting social networks from literature, namely, nineteenth-century British novels and serials. We derive the networks from dialogue interactions, and thus our method depends on the ability to determine when two characters are in conversation. Our approach involves character name chunking, quoted speech attribution and conversation detection given the set of quotes. We extract features from the social networks and examine their correlation with one another, as well as with metadata such as the novel’s setting. Our results provide evidence that the majority of novels in this time period do not fit two characterizations provided by literacy scholars. Instead, our results suggest an alternative explanation for differences in social networks.</p></blockquote>
<p>　　Best Paper Awards是由ACL的一个专门委员会评选出的，将在大会结束时进行颁奖。ACL 2010还有一个”Lifetime Achievement Award（终生成就奖）“，不过目前还没有揭晓获奖者。关于这个奖项，ACL 2010给了一段很有意思的介绍：</p>
<blockquote><p>The ACL Lifetime Achievement Award (LTA) was instituted on the occasion of the Association&#8217;s 40th anniversary meeting.  The award is presented for scientific achievement, of both theoretical and applied nature, in the field of Computational Linguistics.  Currently, an ACL committee nominates and selects at most one award recipient annually, considering the originality, depth, breadth, and impact of the entire body of the nominee&#8217;s work in the field. The award is a crystal trophy and the recipient is invited to give a 45-minute speech on his or her view of the development of Computational Linguistics at the annual meeting of the association.  As of 2004, the speech has been subsequently published in the Association&#8217;s journal, Computational Linguistics.  The speech is introduced by the announcement of the award winner, whose identity is not made public until that time.</p></blockquote>
<p>　　Lifetime Achievement Award（终生成就奖）每届最多只授予一位对于自然语言处理与计算语言学有着举足轻重影响的候选者，此前获得该奖项的分别是：Aravind Joshi (2002), Makoto Nagao (2003), Karen Spärck Jones (2004), Martin Kay (2005), Eva Hajicová (2006), Lauri Karttunen (2007), Yorick Wilks (2008) and Fred Jelinek (2009).  </p>
<p>注：转载请注明出处“<a href="http://www.52nlp.cn">我爱自然语言处理</a>”：<a href="http://www.52nlp.cn">www.52nlp.cn</a></p>
<p>本文链接地址：<a href="http://www.52nlp.cn/acl-2010-best-paper-awards">http://www.52nlp.cn/acl-2010-best-paper-awards</a></p>
<p>
<!-- Begin Google Adsense code -->
<script type="text/javascript"><!--
google_ad_client = "pub-4332174469367599";
/* 336x280, 创建于 09-2-7 */
google_ad_slot = "5707022987";
google_ad_width = 336;
google_ad_height = 280;
//-->
</script>
<script type="text/javascript"
src="http://pagead2.googlesyndication.com/pagead/show_ads.js">
</script>
<!-- End Google Adsense code -->
   </p>


<p>相关文章:<ol><li><a href='http://www.52nlp.cn/acl-ijcnlp-2009-best-paper-awards' rel='bookmark' title='Permanent Link: ACL-IJCNLP 2009 Best Paper Awards'>ACL-IJCNLP 2009 Best Paper Awards</a></li>
<li><a href='http://www.52nlp.cn/acl-ijcnlp-2009-running-one' rel='bookmark' title='Permanent Link: ACL-IJCNLP 2009会议进行时一'>ACL-IJCNLP 2009会议进行时一</a></li>
<li><a href='http://www.52nlp.cn/acl-2010%e6%96%87%e7%ab%a0%e5%b7%b2%e5%8f%af%e4%b8%8b%e8%bd%bd' rel='bookmark' title='Permanent Link: ACL 2010文章已可下载'>ACL 2010文章已可下载</a></li>
<li><a href='http://www.52nlp.cn/acl-2010-paper-%e5%9b%bd%e5%86%85%e7%a0%94%e7%a9%b6%e5%8d%95%e4%bd%8d%e5%bd%95%e7%94%a8%e6%83%85%e5%86%b5' rel='bookmark' title='Permanent Link: ACL 2010 Paper国内研究单位录用情况'>ACL 2010 Paper国内研究单位录用情况</a></li>
<li><a href='http://www.52nlp.cn/coling-2010-prospect' rel='bookmark' title='Permanent Link: COLING 2010前瞻——规则与统计共舞，语言随计算齐飞'>COLING 2010前瞻——规则与统计共舞，语言随计算齐飞</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-and-computational-linguistics-books-summary-six-foreign-book' rel='bookmark' title='Permanent Link: 自然语言处理与计算语言学书籍汇总之六：国外书籍'>自然语言处理与计算语言学书籍汇总之六：国外书籍</a></li>
<li><a href='http://www.52nlp.cn/acl-ijcnlp-2009-%e8%af%84%e8%bf%b0%e8%8a%82%e9%80%89' rel='bookmark' title='Permanent Link: ACL-IJCNLP 2009 评述节选'>ACL-IJCNLP 2009 评述节选</a></li>
<li><a href='http://www.52nlp.cn/acl-2010-list-of-accepted-papers' rel='bookmark' title='Permanent Link: ACL 2010: List of Accepted Papers'>ACL 2010: List of Accepted Papers</a></li>
<li><a href='http://www.52nlp.cn/acl-anthology-computational-linguistics-digital-archive' rel='bookmark' title='Permanent Link: ACL Anthology——计算语言学的数字档案'>ACL Anthology——计算语言学的数字档案</a></li>
<li><a href='http://www.52nlp.cn/about-acl-anthology-network' rel='bookmark' title='Permanent Link: ACL Anthology 姊妹篇：ACL Anthology Network'>ACL Anthology 姊妹篇：ACL Anthology Network</a></li>
</ol></p><img src="http://feeds.feedburner.com/~r/52nlp/~4/CixbXgGjhyY" height="1" width="1"/>]]></content:encoded>
			<wfw:commentRss>http://www.52nlp.cn/acl-2010-best-paper-awards/feed</wfw:commentRss>
		<slash:comments>3</slash:comments>
		<feedburner:origLink>http://www.52nlp.cn/acl-2010-best-paper-awards</feedburner:origLink></item>
		<item>
		<title>ACL 2010文章已可下载</title>
		<link>http://feedproxy.google.com/~r/52nlp/~3/0OPn-TcXP1c/acl-2010%e6%96%87%e7%ab%a0%e5%b7%b2%e5%8f%af%e4%b8%8b%e8%bd%bd</link>
		<comments>http://www.52nlp.cn/acl-2010%e6%96%87%e7%ab%a0%e5%b7%b2%e5%8f%af%e4%b8%8b%e8%bd%bd#comments</comments>
		<pubDate>Sun, 11 Jul 2010 14:30:49 +0000</pubDate>
		<dc:creator>52nlp</dc:creator>
				<category><![CDATA[自然语言处理]]></category>
		<category><![CDATA[计算语言学]]></category>
		<category><![CDATA[ACL]]></category>
		<category><![CDATA[ACL 2010]]></category>
		<category><![CDATA[ACL Anthology]]></category>
		<category><![CDATA[Min-Yen Kan]]></category>

		<guid isPermaLink="false">http://www.52nlp.cn/?p=3398</guid>
		<description><![CDATA[　　晚上收到ACL Anthology负责人Min-Yen Kan发给ACL Anthology Google Group的邮件，通知说目前ACL 2010的文章已经可以下载，包括full papers, short papers, student research workshop papers, demonstrations, tutorial abstracts以及所有的workshops的Paper，才想起今天（7月11号）ACL 2010会议召开。以下是具体的下载地址，有兴趣的读者可以关注一下。
　　一、ACL 2010大会论文集：
　　Proceedings of the ACL 2010 conference can be found here:
　　http://www.aclweb.org/anthology/P/P10/
　　These include both volumes: (I) full papers and (II) short papers,student research workshop papers, demonstrations and tutorial abstracts.
　　二、Workshop论文集：
　　The proceedings of the workshops and conferences co-located with ACL 2010 [...]


相关文章:<ol><li><a href='http://www.52nlp.cn/acl-anthology-computational-linguistics-digital-archive' rel='bookmark' title='Permanent Link: ACL Anthology——计算语言学的数字档案'>ACL Anthology——计算语言学的数字档案</a></li>
<li><a href='http://www.52nlp.cn/coling-2010-prospect' rel='bookmark' title='Permanent Link: COLING 2010前瞻——规则与统计共舞，语言随计算齐飞'>COLING 2010前瞻——规则与统计共舞，语言随计算齐飞</a></li>
<li><a href='http://www.52nlp.cn/acl-wiki-encyclopedia-of-computational-linguistics' rel='bookmark' title='Permanent Link: ACL Wiki——计算语言学的百科全书'>ACL Wiki——计算语言学的百科全书</a></li>
<li><a href='http://www.52nlp.cn/about-acl-anthology-network' rel='bookmark' title='Permanent Link: ACL Anthology 姊妹篇：ACL Anthology Network'>ACL Anthology 姊妹篇：ACL Anthology Network</a></li>
<li><a href='http://www.52nlp.cn/acl-ijcnlp-2009-running-one' rel='bookmark' title='Permanent Link: ACL-IJCNLP 2009会议进行时一'>ACL-IJCNLP 2009会议进行时一</a></li>
<li><a href='http://www.52nlp.cn/getting-started-in-natural-language-processing' rel='bookmark' title='Permanent Link: 如何学习自然语言处理'>如何学习自然语言处理</a></li>
<li><a href='http://www.52nlp.cn/acl-2010-best-paper-awards' rel='bookmark' title='Permanent Link: ACL 2010 Best Paper Awards'>ACL 2010 Best Paper Awards</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-and-computational-linguistics-common-abbreviations-acronyms' rel='bookmark' title='Permanent Link: 自然语言处理及计算语言学常见缩略语'>自然语言处理及计算语言学常见缩略语</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-and-computational-linguistics-books-summary-seven-other-book' rel='bookmark' title='Permanent Link: 自然语言处理与计算语言学书籍汇总之七：其他书籍'>自然语言处理与计算语言学书籍汇总之七：其他书籍</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-and-computational-linguistics-books-summary-six-foreign-book' rel='bookmark' title='Permanent Link: 自然语言处理与计算语言学书籍汇总之六：国外书籍'>自然语言处理与计算语言学书籍汇总之六：国外书籍</a></li>
</ol>]]></description>
			<content:encoded><![CDATA[<p>　　晚上收到<a href="http://www.52nlp.cn/acl-anthology-computational-linguistics-digital-archive">ACL Anthology</a>负责人Min-Yen Kan发给ACL Anthology Google Group的邮件，通知说目前ACL 2010的文章已经可以下载，包括full papers, short papers, student research workshop papers, demonstrations, tutorial abstracts以及所有的workshops的Paper，才想起今天（7月11号）ACL 2010会议召开。以下是具体的下载地址，有兴趣的读者可以关注一下。<span id="more-3398"></span></p>
<p>　　一、ACL 2010大会论文集：<br />
　　Proceedings of the ACL 2010 conference can be found here:<br />
　　<a href=" http://www.aclweb.org/anthology/P/P10/"target=_blank>http://www.aclweb.org/anthology/P/P10/</a><br />
　　These include both volumes: (I) full papers and (II) short papers,student research workshop papers, demonstrations and tutorial abstracts.</p>
<p>　　二、Workshop论文集：<br />
　　The proceedings of the workshops and conferences co-located with ACL 2010 are now online.<br />
　　<a href="http://www.aclweb.org/anthology/W/W10/"target=_blank>http://www.aclweb.org/anthology/W/W10/</a><br />
(scroll towards the bottom of the table of contents)</p>
<p>* Joint Fifth Workshop on Statistical Machine Translation and MetricsMATR<br />
* Fourth Linguistic Annotation Workshop<br />
* 2010 Workshop on Biomedical Natural Language Processing<br />
* 2010 Workshop on Cognitive Modeling and Computational Linguistics<br />
* 2010 Workshop on NLP and Linguistics: Finding the Common Ground<br />
* 11th Meeting of the ACL Special Interest Group on Computational Morphology and Phonology<br />
* TextGraphs-5 &#8211; 2010 Workshop on Graph-based Methods for Natural Language Processing<br />
* 2010 Named Entities Workshop<br />
* 2010 Workshop on Applications of Tree Automata in Natural Language Processing<br />
* 2010 Workshop on Domain Adaptation for Natural Language Processing<br />
* 2010 Workshop on Companionable Dialogue Systems<br />
* 2010 Workshop on GEometrical Models of Natural Language Semantics</p>
<p>注：转载请注明出处“<a href="http://www.52nlp.cn">我爱自然语言处理</a>”：<a href="http://www.52nlp.cn">www.52nlp.cn</a></p>
<p>本文链接地址：<a href="http://www.52nlp.cn/acl-2010文章已可下载">http://www.52nlp.cn/acl-2010文章已可下载</a></p>
<p>
<!-- Begin Google Adsense code -->
<script type="text/javascript"><!--
google_ad_client = "pub-4332174469367599";
/* 336x280, 创建于 09-2-7 */
google_ad_slot = "5707022987";
google_ad_width = 336;
google_ad_height = 280;
//-->
</script>
<script type="text/javascript"
src="http://pagead2.googlesyndication.com/pagead/show_ads.js">
</script>
<!-- End Google Adsense code -->
      </p>


<p>相关文章:<ol><li><a href='http://www.52nlp.cn/acl-anthology-computational-linguistics-digital-archive' rel='bookmark' title='Permanent Link: ACL Anthology——计算语言学的数字档案'>ACL Anthology——计算语言学的数字档案</a></li>
<li><a href='http://www.52nlp.cn/coling-2010-prospect' rel='bookmark' title='Permanent Link: COLING 2010前瞻——规则与统计共舞，语言随计算齐飞'>COLING 2010前瞻——规则与统计共舞，语言随计算齐飞</a></li>
<li><a href='http://www.52nlp.cn/acl-wiki-encyclopedia-of-computational-linguistics' rel='bookmark' title='Permanent Link: ACL Wiki——计算语言学的百科全书'>ACL Wiki——计算语言学的百科全书</a></li>
<li><a href='http://www.52nlp.cn/about-acl-anthology-network' rel='bookmark' title='Permanent Link: ACL Anthology 姊妹篇：ACL Anthology Network'>ACL Anthology 姊妹篇：ACL Anthology Network</a></li>
<li><a href='http://www.52nlp.cn/acl-ijcnlp-2009-running-one' rel='bookmark' title='Permanent Link: ACL-IJCNLP 2009会议进行时一'>ACL-IJCNLP 2009会议进行时一</a></li>
<li><a href='http://www.52nlp.cn/getting-started-in-natural-language-processing' rel='bookmark' title='Permanent Link: 如何学习自然语言处理'>如何学习自然语言处理</a></li>
<li><a href='http://www.52nlp.cn/acl-2010-best-paper-awards' rel='bookmark' title='Permanent Link: ACL 2010 Best Paper Awards'>ACL 2010 Best Paper Awards</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-and-computational-linguistics-common-abbreviations-acronyms' rel='bookmark' title='Permanent Link: 自然语言处理及计算语言学常见缩略语'>自然语言处理及计算语言学常见缩略语</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-and-computational-linguistics-books-summary-seven-other-book' rel='bookmark' title='Permanent Link: 自然语言处理与计算语言学书籍汇总之七：其他书籍'>自然语言处理与计算语言学书籍汇总之七：其他书籍</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-and-computational-linguistics-books-summary-six-foreign-book' rel='bookmark' title='Permanent Link: 自然语言处理与计算语言学书籍汇总之六：国外书籍'>自然语言处理与计算语言学书籍汇总之六：国外书籍</a></li>
</ol></p><img src="http://feeds.feedburner.com/~r/52nlp/~4/0OPn-TcXP1c" height="1" width="1"/>]]></content:encoded>
			<wfw:commentRss>http://www.52nlp.cn/acl-2010%e6%96%87%e7%ab%a0%e5%b7%b2%e5%8f%af%e4%b8%8b%e8%bd%bd/feed</wfw:commentRss>
		<slash:comments>10</slash:comments>
		<feedburner:origLink>http://www.52nlp.cn/acl-2010%e6%96%87%e7%ab%a0%e5%b7%b2%e5%8f%af%e4%b8%8b%e8%bd%bd</feedburner:origLink></item>
		<item>
		<title>自然语言处理与世界杯</title>
		<link>http://feedproxy.google.com/~r/52nlp/~3/njtT16mIAlM/%e8%87%aa%e7%84%b6%e8%af%ad%e8%a8%80%e5%a4%84%e7%90%86%e4%b8%8e%e4%b8%96%e7%95%8c%e6%9d%af</link>
		<comments>http://www.52nlp.cn/%e8%87%aa%e7%84%b6%e8%af%ad%e8%a8%80%e5%a4%84%e7%90%86%e4%b8%8e%e4%b8%96%e7%95%8c%e6%9d%af#comments</comments>
		<pubDate>Wed, 30 Jun 2010 13:00:36 +0000</pubDate>
		<dc:creator>52nlp</dc:creator>
				<category><![CDATA[自然语言处理]]></category>
		<category><![CDATA[随笔]]></category>
		<category><![CDATA[世界杯]]></category>
		<category><![CDATA[情感分析]]></category>
		<category><![CDATA[章成志]]></category>
		<category><![CDATA[聚类]]></category>

		<guid isPermaLink="false">http://www.52nlp.cn/?p=3389</guid>
		<description><![CDATA[　　自然语言处理与世界杯似乎没啥关系，不过今晚世界杯没有比赛了，我也可以回来照顾一下52nlp了。但是这两者的确没什么关系，我简单的Google了一下“自然语言处理 &#038; 世界杯”，没有什么好的材料，就先从读者评论说起吧。
　　读者Brishen评论：“可不可以对网络上赛前的言论做sentiment analysis来预测一下比赛结果呢？” 估计Brishen对Sentiment analysis（情感分析）有比较深的认识，我个人没有任何这方面的经验，不过感觉是一个不错的方向，不仅仅对于世界杯。如果读者有这方面的经验，欢迎在这里讨论。
　　聚类在自然语言处理中也有比较重要的应用，譬如词的聚类或者文本聚类。章成志老师近期写了一篇《世界杯比赛规则与数据聚类》，大概是与世界杯相关的最具科普性的一篇博文了，和自然语言处理也能扯点关系，以下全文转载自章成志老师的博客。
　　　　　　　　　世界杯比赛规则与数据聚类
       　　应该有很多博友像我一样，这段时间可能要花些时间看世界杯。有些博友还会发些心得。俺就从数据聚类的角度，来对世界杯比赛规则进行“重认识”一下，呵呵。
       　　先交代下基础背景知识，内行直接跳过本段，呵呵。数据聚类包括划分聚类、层次聚类等、基于模型的聚类等基本模式。划分聚类中最经典的方法就是K-均值聚类，需要事先给定初始点和聚类类目数。层次聚类中最常用的是HAC聚类，事先两两求出相似度，将最相似的或者最不相似的连接起来呢，然后再求次相似的，一直到所有点的都被连接为止。近年来，基于模型的聚类越来越火，可以将基于竞争的聚类方法划入这个类别。07年Frey提出的AP聚类方法更是被大量引用。
      　　再结合数据聚类，说下世界杯比赛规则。
      　　1. 首先，小组划分，是做基于约束的划分聚类：    
      　　(1) 经过预选赛入围的32只球队，被划分为4个档次，其中第一档中的8支球队作为种子队 （32个数据，8个聚类类目，将以往世界排名作为权重，选择初始聚类中心，当然东道主特殊，直接作为种子）；
      　　(2) 剩余球队按照其档次和所在洲的约束，进行抽签划分到相应的小组中（24个数据按照一定的规则约束后，随机分配到每个聚类中心的所在组中）；
 　　   [...]


相关文章:<ol><li><a href='http://www.52nlp.cn/natural-language-processing-company-teragram' rel='bookmark' title='Permanent Link: 自然语言处理公司巡礼一：Teragram'>自然语言处理公司巡礼一：Teragram</a></li>
<li><a href='http://www.52nlp.cn/tears-and-uninitiated-learn-from-natural-language-processing-heros' rel='bookmark' title='Permanent Link: “眼泪”与“门外汉”——向自然语言处理的大牛们学习'>“眼泪”与“门外汉”——向自然语言处理的大牛们学习</a></li>
<li><a href='http://www.52nlp.cn/nlpers-can-not-visit-recently' rel='bookmark' title='Permanent Link: nlpers最近无法访问'>nlpers最近无法访问</a></li>
<li><a href='http://www.52nlp.cn/i-love-natural-language-processing-stage-summary' rel='bookmark' title='Permanent Link: “我爱自然语言处理”阶段性总结'>“我爱自然语言处理”阶段性总结</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-company-metaweb' rel='bookmark' title='Permanent Link: 自然语言处理公司巡礼六：Metaweb'>自然语言处理公司巡礼六：Metaweb</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-company-autonomy' rel='bookmark' title='Permanent Link: 自然语言处理公司巡礼五：Autonomy'>自然语言处理公司巡礼五：Autonomy</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-company-systran' rel='bookmark' title='Permanent Link: 自然语言处理公司巡礼四：Systran'>自然语言处理公司巡礼四：Systran</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-company-inxight' rel='bookmark' title='Permanent Link: 自然语言处理公司巡礼三：Inxight'>自然语言处理公司巡礼三：Inxight</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-company-powerset' rel='bookmark' title='Permanent Link: 自然语言处理公司巡礼二：Powerset'>自然语言处理公司巡礼二：Powerset</a></li>
<li><a href='http://www.52nlp.cn/%e8%87%aa%e7%84%b6%e8%af%ad%e8%a8%80%e5%a4%84%e7%90%86%e4%b8%8e%e5%8c%bb%e7%96%97%e5%81%a5%e5%ba%b7' rel='bookmark' title='Permanent Link: 自然语言处理与医疗健康'>自然语言处理与医疗健康</a></li>
</ol>]]></description>
			<content:encoded><![CDATA[<p>　　自然语言处理与世界杯似乎没啥关系，不过今晚世界杯没有比赛了，我也可以回来照顾一下52nlp了。但是这两者的确没什么关系，我简单的Google了一下“自然语言处理 &#038; 世界杯”，没有什么好的材料，就先从读者评论说起吧。<span id="more-3389"></span><br />
　　读者Brishen评论：“可不可以对网络上赛前的言论做sentiment analysis来预测一下比赛结果呢？” 估计Brishen对Sentiment analysis（情感分析）有比较深的认识，我个人没有任何这方面的经验，不过感觉是一个不错的方向，不仅仅对于世界杯。如果读者有这方面的经验，欢迎在这里讨论。<br />
　　聚类在自然语言处理中也有比较重要的应用，譬如词的聚类或者文本聚类。章成志老师近期写了一篇《<a href="http://www.sciencenet.cn/m/user_content.aspx?id=339277"target=_blank>世界杯比赛规则与数据聚类</a>》，大概是与世界杯相关的最具科普性的一篇博文了，和自然语言处理也能扯点关系，以下全文转载自<a href="http://www.sciencenet.cn/u/timy/">章成志老师的博客</a>。</p>
<blockquote><p>　　　　　　　　　世界杯比赛规则与数据聚类</p>
<p>       　　应该有很多博友像我一样，这段时间可能要花些时间看世界杯。有些博友还会发些心得。俺就从数据聚类的角度，来对世界杯比赛规则进行“重认识”一下，呵呵。</p>
<p>       　　先交代下基础背景知识，内行直接跳过本段，呵呵。数据聚类包括划分聚类、层次聚类等、基于模型的聚类等基本模式。划分聚类中最经典的方法就是K-均值聚类，需要事先给定初始点和聚类类目数。层次聚类中最常用的是HAC聚类，事先两两求出相似度，将最相似的或者最不相似的连接起来呢，然后再求次相似的，一直到所有点的都被连接为止。近年来，基于模型的聚类越来越火，可以将基于竞争的聚类方法划入这个类别。07年Frey提出的AP聚类方法更是被大量引用。</p>
<p>      　　再结合数据聚类，说下世界杯比赛规则。</p>
<p>      　　1. 首先，小组划分，是做基于约束的划分聚类：    </p>
<p>      　　(1) 经过预选赛入围的32只球队，被划分为4个档次，其中第一档中的8支球队作为种子队 （32个数据，8个聚类类目，将以往世界排名作为权重，选择初始聚类中心，当然东道主特殊，直接作为种子）；</p>
<p>      　　(2) 剩余球队按照其档次和所在洲的约束，进行抽签划分到相应的小组中（24个数据按照一定的规则约束后，随机分配到每个聚类中心的所在组中）；</p>
<p> 　　     2. 然后，正式比赛，是做层次聚类：</p>
<p>      　　(1) 小组确定后，每组四个对，两两求“相似度”，就是说两两打一场，胜的权重给3，平了给1，输了给0，每小组的6场赛事结束后，得到每个队的总体权重（当然了，有可能还要考虑净胜球，相互战绩啥的），那么小组中排名前2的队作为连接点参与下一个层次的聚类。（这里，两两求相似度，完全是基于竞争的，整个比赛阶段基于竞争的层次聚类）；</p>
<p>      　　(2) 淘汰赛阶段，直接竞争，做二分聚类，胜的参加下一轮聚类；</p>
<p>　　(3) 直到最后两支最牛的打决赛，冠军队成为了根节点。</p>
<p>     　　 3. 聚类结束，参数重新分配，准备4年后的聚类，呵呵。</p>
<p>　　     所以，世界杯做了大量的约束，注意比赛的观赏性，用了比较简单公平的方法，在较短时间内确定聚类层次关系。</p>
<p>     　　如果是动物界打比赛，可能又是另一个场景，完全自由随机的打，最强的完全有可能因为体力不支，提早被淘汰而成不了冠军。</p>
<p>　　    以上仅供娱乐参考，推理和比喻不当地方，请博友指出，谢谢。</p></blockquote>
<p>　　关于自然语言处理与世界杯，不知道读者朋友还能想到些什么？</p>
<p>注：转载请注明出处“<a href="http://www.52nlp.cn">我爱自然语言处理</a>”：<a href="http://www.52nlp.cn">www.52nlp.cn</a></p>
<p>本文链接地址：<a href="http://www.52nlp.cn/自然语言处理与世界杯">http://www.52nlp.cn/自然语言处理与世界杯</a></p>
<p>
<!-- Begin Google Adsense code -->
<script type="text/javascript"><!--
google_ad_client = "pub-4332174469367599";
/* 336x280, 创建于 09-2-7 */
google_ad_slot = "5707022987";
google_ad_width = 336;
google_ad_height = 280;
//-->
</script>
<script type="text/javascript"
src="http://pagead2.googlesyndication.com/pagead/show_ads.js">
</script>
<!-- End Google Adsense code -->
      </p>


<p>相关文章:<ol><li><a href='http://www.52nlp.cn/natural-language-processing-company-teragram' rel='bookmark' title='Permanent Link: 自然语言处理公司巡礼一：Teragram'>自然语言处理公司巡礼一：Teragram</a></li>
<li><a href='http://www.52nlp.cn/tears-and-uninitiated-learn-from-natural-language-processing-heros' rel='bookmark' title='Permanent Link: “眼泪”与“门外汉”——向自然语言处理的大牛们学习'>“眼泪”与“门外汉”——向自然语言处理的大牛们学习</a></li>
<li><a href='http://www.52nlp.cn/nlpers-can-not-visit-recently' rel='bookmark' title='Permanent Link: nlpers最近无法访问'>nlpers最近无法访问</a></li>
<li><a href='http://www.52nlp.cn/i-love-natural-language-processing-stage-summary' rel='bookmark' title='Permanent Link: “我爱自然语言处理”阶段性总结'>“我爱自然语言处理”阶段性总结</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-company-metaweb' rel='bookmark' title='Permanent Link: 自然语言处理公司巡礼六：Metaweb'>自然语言处理公司巡礼六：Metaweb</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-company-autonomy' rel='bookmark' title='Permanent Link: 自然语言处理公司巡礼五：Autonomy'>自然语言处理公司巡礼五：Autonomy</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-company-systran' rel='bookmark' title='Permanent Link: 自然语言处理公司巡礼四：Systran'>自然语言处理公司巡礼四：Systran</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-company-inxight' rel='bookmark' title='Permanent Link: 自然语言处理公司巡礼三：Inxight'>自然语言处理公司巡礼三：Inxight</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-company-powerset' rel='bookmark' title='Permanent Link: 自然语言处理公司巡礼二：Powerset'>自然语言处理公司巡礼二：Powerset</a></li>
<li><a href='http://www.52nlp.cn/%e8%87%aa%e7%84%b6%e8%af%ad%e8%a8%80%e5%a4%84%e7%90%86%e4%b8%8e%e5%8c%bb%e7%96%97%e5%81%a5%e5%ba%b7' rel='bookmark' title='Permanent Link: 自然语言处理与医疗健康'>自然语言处理与医疗健康</a></li>
</ol></p><img src="http://feeds.feedburner.com/~r/52nlp/~4/njtT16mIAlM" height="1" width="1"/>]]></content:encoded>
			<wfw:commentRss>http://www.52nlp.cn/%e8%87%aa%e7%84%b6%e8%af%ad%e8%a8%80%e5%a4%84%e7%90%86%e4%b8%8e%e4%b8%96%e7%95%8c%e6%9d%af/feed</wfw:commentRss>
		<slash:comments>14</slash:comments>
		<feedburner:origLink>http://www.52nlp.cn/%e8%87%aa%e7%84%b6%e8%af%ad%e8%a8%80%e5%a4%84%e7%90%86%e4%b8%8e%e4%b8%96%e7%95%8c%e6%9d%af</feedburner:origLink></item>
		<item>
		<title>COLING 2010: List of Accepted Papers (Oral)</title>
		<link>http://feedproxy.google.com/~r/52nlp/~3/mCHtS9xfDHk/coling-2010-list-of-accepted-papers-oral</link>
		<comments>http://www.52nlp.cn/coling-2010-list-of-accepted-papers-oral#comments</comments>
		<pubDate>Fri, 04 Jun 2010 12:31:58 +0000</pubDate>
		<dc:creator>52nlp</dc:creator>
				<category><![CDATA[自然语言处理]]></category>
		<category><![CDATA[计算语言学]]></category>
		<category><![CDATA[COLING]]></category>
		<category><![CDATA[COLING 2010]]></category>
		<category><![CDATA[中文信息学会]]></category>

		<guid isPermaLink="false">http://www.52nlp.cn/?p=3385</guid>
		<description><![CDATA[　　这是Coling 2010的List of Accepted Papers(Oral)，先是从水木自然语言处理社区看到，才在Coling的官方主页上找到。关于Coling本次的录用情况，水木自然语言处理版已经有过一波大讨论了，有兴趣的读者可以关注一下。 Coling是ACL之外另一个自然语言处理与计算语言学界的顶级会议，全称国际计算语言学大会(International Conference on Computational Linguistics)，每两年举办一次，第23届COLING会议将于2010年8月23日~27日在中国北京举行，由中文信息学会承办。
　　以下仅列出Oral的录用情况，关于Poster的录用情况，可以在Coling 2010官方网站的全部录用结果中找到：
　　http://www.coling-2010.org/accepted%20papers.htm
Oral
   1.  Adrian Bickerstaffe and Ingrid Zukerman. A Hierarchical Classifier Applied to Multi-way Sentiment Detection
   2. Yiping Zhou, Lan Nie and Scott Gaffney. Surface Form Resolution Based on Wikipedia
   3. Zhongwu Zhai, Bing Liu, Hua Xu and Peifa [...]


相关文章:<ol><li><a href='http://www.52nlp.cn/acl-2010-list-of-accepted-papers' rel='bookmark' title='Permanent Link: ACL 2010: List of Accepted Papers'>ACL 2010: List of Accepted Papers</a></li>
<li><a href='http://www.52nlp.cn/acl-2010-paper-%e5%9b%bd%e5%86%85%e7%a0%94%e7%a9%b6%e5%8d%95%e4%bd%8d%e5%bd%95%e7%94%a8%e6%83%85%e5%86%b5' rel='bookmark' title='Permanent Link: ACL 2010 Paper国内研究单位录用情况'>ACL 2010 Paper国内研究单位录用情况</a></li>
<li><a href='http://www.52nlp.cn/coling-2010-prospect' rel='bookmark' title='Permanent Link: COLING 2010前瞻——规则与统计共舞，语言随计算齐飞'>COLING 2010前瞻——规则与统计共舞，语言随计算齐飞</a></li>
<li><a href='http://www.52nlp.cn/acl-ijcnlp-2009-running-two' rel='bookmark' title='Permanent Link: ACL-IJCNLP 2009会议进行时二'>ACL-IJCNLP 2009会议进行时二</a></li>
<li><a href='http://www.52nlp.cn/acl09-full-paper-accepted-details' rel='bookmark' title='Permanent Link: ACL09 Full Paper录用情况'>ACL09 Full Paper录用情况</a></li>
<li><a href='http://www.52nlp.cn/acl-ijcnlp-2009-running-one' rel='bookmark' title='Permanent Link: ACL-IJCNLP 2009会议进行时一'>ACL-IJCNLP 2009会议进行时一</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-and-computational-linguistics-common-abbreviations-acronyms' rel='bookmark' title='Permanent Link: 自然语言处理及计算语言学常见缩略语'>自然语言处理及计算语言学常见缩略语</a></li>
<li><a href='http://www.52nlp.cn/acl-2010-best-paper-awards' rel='bookmark' title='Permanent Link: ACL 2010 Best Paper Awards'>ACL 2010 Best Paper Awards</a></li>
<li><a href='http://www.52nlp.cn/acl09-acceptance-rates-by-areas' rel='bookmark' title='Permanent Link: ACL09 Full Paper各研究领域的录用情况'>ACL09 Full Paper各研究领域的录用情况</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-and-machine-translation-faq' rel='bookmark' title='Permanent Link: 自然语言处理与机器翻译FAQ'>自然语言处理与机器翻译FAQ</a></li>
</ol>]]></description>
			<content:encoded><![CDATA[<p>　　这是Coling 2010的List of Accepted Papers(Oral)，先是从水木自然语言处理社区看到，才在Coling的官方主页上找到。关于Coling本次的录用情况，水木自然语言处理版已经有过一波大讨论了，有兴趣的读者可以关注一下。 Coling是ACL之外另一个自然语言处理与计算语言学界的顶级会议，全称国际计算语言学大会(International Conference on Computational Linguistics)，每两年举办一次，第23届COLING会议将于2010年8月23日~27日在中国北京举行，由中文信息学会承办。<span id="more-3385"></span><br />
　　以下仅列出Oral的录用情况，关于Poster的录用情况，可以在Coling 2010官方网站的全部录用结果中找到：<br />
　　<a href="http://www.coling-2010.org/accepted%20papers.htm"target=_blank>http://www.coling-2010.org/accepted%20papers.htm</a></p>
<p>Oral<br />
   1.  Adrian Bickerstaffe and Ingrid Zukerman. A Hierarchical Classifier Applied to Multi-way Sentiment Detection<br />
   2. Yiping Zhou, Lan Nie and Scott Gaffney. Surface Form Resolution Based on Wikipedia<br />
   3. Zhongwu Zhai, Bing Liu, Hua Xu and Peifa Jia. Grouping Product Features Using Semi-Supervised Learning with Soft-Constraints<br />
   4. Qin Gao, Francisco Guzman and Stephan Vogel. EMDC: A Semi-supervised Approach for Word Alignment<br />
   5. George Tsatsaronis, Iraklis Varlamis and Kjetil Nørvåg. SemanticRank: Ranking Keywords and Sentences Using Semantic Graphs<br />
   6. Jian Huang, Pucktada Treeratpituk, Sarah Taylor and C. Lee Giles. Enhancing Cross Document Coreference of Web Documents with Context Similarity and Very Large Scale Text Categorization<br />
   7. Verena Henrich and Erhard Hinrichs. Standardizing Wordnets in the ISO Standard Wordnet-LMF: The Case of GermaNet<br />
   8. Ekaterina Shutova, Lin Sun and Anna Korhonen. Metaphor Identification Using Verb and Noun Clustering<br />
   9. Xiaoyan Cai, Wenjie Li and You Ouyang. Simultaneous Ranking and Clustering of Sentences: An Reinforcement Approach to Multi-Document Summarization<br />
  10. Peter Nilsson and Pierre Nugues. Automatic Discovery of Feature Sets for Dependency Parsing<br />
  11. Kavita Ganesan and ChengXiang Zhai. Opinosis: A Graph Based Approach to Abstractive Summarization of Highly Redundant Opinions<br />
  12. Doo Soon Kim, Ken Barker and Bruce Porter. Improving the Quality of Text Understanding by Delaying Ambiguity Resolution<br />
  13. Gumwon Hong, Chi-Ho Li, Ming Zhou and Hae-Chang Rim. An Empirical Study on Web Mining of Parallel Data<br />
  14. Nigel Collier, Reiko Matsuda Goodwin, John McCrae, Son Doan, Ai Kawazoe, Mike Conway, Asanee Kawtrakul, Koichi Takeuchi and Dinh Dien. An ontology-driven system for detecting global health events<br />
  15. Changqin Quan and Fuji Ren. An Exploration of Features for Recognizing Word Emotion<br />
  16. Jun Sun, Min Zhang and Chew Lim Tan. Discriminative Induction of Sub-Tree Alignment using Limited Labeled Data<br />
  17. Wanxiang Che and Ting Liu. Jointly Modeling WSD and SRL with Markov Logic<br />
  18. Su Nam Kim, Timothy Baldwin and Min-Yen Kan. Evaluating N-gram based Evaluation Metrics for Automatic Keyphrase Extraction<br />
  19. Yang Liu and Qun Liu. Joint Parsing and Translation<br />
  20. Shiqi Zhao, Haifeng Wang and Ting Liu. Paraphrasing with Search Engine Query Logs<br />
  21. Daniel Tse and James R. Curran. Chinese CCGbank: extracting CCG derivations from the Penn Chinese Treebank<br />
  22. Liang-Chih Yu, Hsiu-Min Shih, Yu-Ling Lai, Jui-Feng Yeh and Chung-Hsien Wu. Discriminative Training for Near-Synonym Substitution<br />
  23. Shiqi Zhao, Haifeng Wang, Xiang Lan and Ting Liu. Leveraging Multiple MT Engines for Paraphrase Generation<br />
  24. Audrey Laroche and Philippe Langlais. Revisiting Context-based Projection Methods for Term-Translation Spotting in Comparable Corpora<br />
  25. Bernd Bohnet. Top Accuracy and Fast Dependency Parsing is not a Contradiction<br />
  26. Sebastian Spiegler and Andrew van der Spuy. Ukwabelana &#8211; An open-source morphological Zulu corpus<br />
  27. Fang KONG, Guodong ZHOU, Longhua QIAN and Qiaoming ZHU. Dependency-driven Anaphoricity Determination for Coreference Resolution<br />
  28. Veronika Vincze and János Csirik. Hungarian Corpus of Light Verb Constructions<br />
  29. ding liu and daniel gildea. Semantic Role Features for Machine Translation<br />
  30. Fan Bu, Xiaoyan Zhu and Ming Li. Measuring the Non-compositionality of Multiword Expressions<br />
  31. Kai Wang and Tat-Seng Chua. Exploiting Salient Patterns for Question Detection and Question Retrieval in Community-based Question Answering<br />
  32. Matthias Hartung and Anette Frank. A Structured Vector Space Model for Hidden Attribute Meaning in Adjective-Noun Phrases<br />
  33. Guintaré Grigonyté, João Paulo Cordeiro, Rumen Moraliyski, Gaël Dias and Pavel Brazdil. Paraphrase Alignment for Synonym Evidence Discovery<br />
  34. Yaakov HaCohen-Kerner, Aharon Tayeb and Natan Ben-Dror. Plagiarism Detection in Computer Science Papers<br />
  35. Shane Bergsma and Colin Cherry. Fast and Accurate Arc Filtering for Dependency Parsing<br />
  36. Fei Huang and Bing Xiang. Feature-Rich Discriminative Phrase Rescoring for SMT<br />
  37. Katja Filippova. Multi-Sentence Compression: Finding Shortest Paths in Word Graphs<br />
  38. Roland Kuhn, Boxing Chen, George Foster and Evan Stratford. Phrase Clustering for Smoothing TM Probabilities – or, How to Extract Paraphrases from Phrase Tables<br />
  39. Josep Maria Crego, Aurélien Max and Fran?ois Yvon. Local lexical adaptation in Machine Translation through triangulation: SMT helping SMT<br />
  40. Young-Suk Lee, Bing Zhao and Xiaoqian Luo. Constituent Reordering and Syntax Models for English-to-Japanese Statistical Machine Translation<br />
  41. Mu Li, Ying-Gong Zhao, Dongdong Zhang and Ming Zhou. Adaptive Log-linear Model Parameter Selection for Statistical Machine Translation<br />
  42. Mengqiu Wang and Christopher Manning. Probabilistic Tree-Edit Models with Structured Latent Variables for Textual Entailment and Question Answering<br />
  43. Sara Salem and Samir AbdelRahman. A Multiple-Domain Ontology Builder<br />
  44. Ge Xu, Xinfan Meng and Houfeng Wang. Build Chinese Emotion Lexicons Using A Graph-based Algorithm and Multiple Resources<br />
  45. Yunfang Wu and Miaomiao Wen. Disambiguating Dynamic Sentiment Ambiguous Adjectives<br />
  46. Shasha Liao and Ralph Grishman. Filtered Ranking for Bootstrapping in Event Extraction<br />
  47. Shoushan Li, Sophia Y. M. Lee, Ying Chen, Chu-Ren Huang and Guodong Zhou. Sentiment Classification and Polarity Shifting<br />
  48. Bernard Brosseau-Villeneuve, Jian-Yun Nie and Noriko Kando. Towards an optimal weighting of context words based on distance<br />
  49. Makoto Miwa, Rune Sætre, Yusuke Miyao and Jun&#8217;ichi Tsujii. Entity-Focused Sentence Simplification for Relation Extraction<br />
  50. Chien Chin Chen and Chen-Yuan Wu. Bipolar Person Name Identification of Topic Documents Using Principal Component Analysis<br />
  51. Fangtao Li, Chao Han, Minlie Huang, Xiaoyan Zhu, Ying-Ju Xia, Shu Zhang and Hao Yu. Structure-Aware Review Mining and Summarization<br />
  52. Hassan Al-Haj and Shuly Wintner. Identifying Multi-word Expressions by Leveraging Morphological and Syntactic Idiosyncrasy<br />
  53. Nan Duan, Mu Li, Dongdong Zhang and Ming Zhou. Mixture Model-based Minimum Bayes Risk Decoding using Multiple Machine Translation Systems<br />
  54. Xinyan Xiao, Yang Liu, YoungSook Hwang, Qun Liu and Shouxun Lin. Joint Tokenization and Translation<br />
  55. Nan Duan. Translation Model Generalization using Probability Averaging for Machine Translation<br />
  56. Anders S?gaard and Christian Rish?j. Robust semi-supervised dependency parsing of German and Swedish using generalized tri-training<br />
  57. Laura Kallmeyer and Wolfgang Maier. Data-Driven Parsing with Probabilistic Linear Context-Free Rewriting Systems<br />
  58. Xian Qian, Qi Zhang, Xuangjing Huang and Lide Wu. 2D Trie for fast parsing<br />
  59. Stergos Afantenos and Nicholas Asher. Testing SDRT&#8217;s Right Frontier: Implications for Machine Learning Discourse Graphs<br />
  60. Naoaki Okazaki and Jun&#8217;ichi Tsujii. Simple and Efficient Algorithm for Approximate Dictionary Matching<br />
  61. Zarrieß Sina, Cahill Aoife, Kuhn Jonas and Rohrer Christian. Cross-Lingual Induction for Deep Broad-Coverage Syntax: A Case Study on German Participles<br />
  62. Jinhua Du and Andy Way. A Discriminative Latent Variable-Based “DE” Classifier for Chinese–English SMT<br />
  63. Makoto Miwa, Sampo Pyysalo, Tadayoshi Hara and Jun&#8217;ichi Tsujii. Evaluating Dependency Representations for Event Extraction<br />
  64. Zhemin Zhu, Delphine Bernhard and Iryna Gurevych. A Monolingual Syntactic Translation Model for Sentence Simplification<br />
  65. Ksenia Shalonova and Bruno Golenia. Weakly Supervised Morphology Learning for Agglutinating Languages Using Small Training Sets.<br />
  66. Xiaojun Wan. Towards a Unified Approach to Simultaneous Single-Document and Multi-Document Summarizations<br />
  67. Seokhwan Kim, Minwoo Jeong, Jonghoon Lee and Gary Geunbae Lee. A Cross-lingual Annotation Projection Approach for Relation Detection<br />
  68. Erwin Marsi and Emiel Krahmer. Automatic analysis of semantic similarity in comparable text through syntactic tree matching<br />
  69. Chao Shen and Tao Li. Multi-Document Summarization via the Minimum Dominating Set<br />
  70. Kun Wang, Chengqing Zong and Keh-Yih Su. A Character-Based Joint Model for Chinese Word Segmentation<br />
  71. Sung-Pil Choi and Sung-Hyon Myaeng. Simplicity is Better: Revisiting Single Kernel PPI Extraction<br />
  72. Tao Zhuang and Chengqing Zong. A Minimum Error Weighting Combination Strategy for Chinese Semantic Role Labeling<br />
  73. Hui Yang, Anne De Roeck, Alistair Willis and Bashar Nuseibeh. A Methodology for Automatic Identification of Nocuous Ambiguity<br />
  74. Toyomi Meguro, Ryuichiro Higashinaka, Yasuhiro Minami and Kohji Dohsaka. Controlling Listening-oriented Dialogue using Partially Observable Markov Decision Processes<br />
  75. Makbule Ozsoy, Ilyas Cicekli and Ferda Alpaslan. Text Summarization of Turkish Texts using Latent Semantic Analysis<br />
  76. Alena Neviarouskaya, Helmut Prendinger and Mitsuru Ishizuka. Recognition of Affect, Judgment, and Appreciation in Text<br />
  77. Mark Dredze, Paul McNamee, Delip Rao, Adam Gerber and Tim Finin. Entity Disambiguation for Knowledge Base Population<br />
  78. Minh-Thang Luong and Min-Yen Kan. Enhancing Morphological Alignment for Translating Highly Inflected Languages<br />
  79. Junhui Li, Guodong Zhou and Qiaoming Zhu. Learning the Scope of Negation via Shallow Semantic Parsing<br />
  80. Graeme Blackwood, Adrià de Gispert and William Byrne. Fluency Constraints for Minimum Bayes-Risk Decoding of Statistical Machine Translation Lattices<br />
  81. Muhua Zhu, Jingbo Zhu and Tong Xiao. Heterogeneous Parsing via Collaborative Decoding<br />
  82. Yue Lu, Huizhong Duan, Hongning Wang and ChengXiang Zhai. Exploiting Structured Ontology to Organize Scattered Online Opinions<br />
  83. Richard Johansson and Alessandro Moschitti. Reranking Models in Fine-grained Opinion Analysis<br />
  84. Ying Chen, Sophia Yat Mei Lee, Shoushan Li and Chu-Ren Huang. Emotion Cause Detection with Linguistic Constructions<br />
  85. Karthik Visweswariah, Jiri Navratil, Jeffrey Sorensen, Vijil Chenthamarakshan and Nandakishore Kambhatla. Syntax Based Reordering with Automatically Derived Rules for Improved Statistical Machine Translation<br />
  86. Bo Li and Eric Gaussier. Improving Corpus Comparability for Bilingual Lexicon Extraction from Comparable Corpora<br />
  87. Zhaopeng Tu, Yang Liu, Young-Sook Hwang, Qun Liu and Shouxun Lin. Dependency Forest for Statistical Machine Translation<br />
  88. Tomek Strzalkowski, George Aaron Broadwell, Jennifer Stromer-Galley, Samira Shaikh, Sarah Taylor and Nick Webb. Modeling Socio-Cultural Phenomena in Discourse<br />
  89. Henning Wachsmuth, Peter Prettenhofer and Benno Stein. Ef?cient Statement Identi?cation for Automatic Market Forecasting<br />
  90. Spence Green and Christopher D. Manning. Better Arabic Parsing: Baselines, Evaluations, and Analysis<br />
  91. Jian Zhang and Pascale Fung. A Rhetorical Syntax-Driven Model for Speech Summarization<br />
  92. Nuria Bel, Maria Coll and Gabriela Resnik. Automatic Detection of Non-deverbal Event Nouns for Quick Lexicon Production<br />
  93. Joakim Nivre, Laura Rimell, Ryan McDonald and Carlos Gómez Rodríguez. Evaluation of Dependency Parsers on Unbounded Dependencies<br />
  94. Lin Sun, Thierry Poibeau, Anna Korhonen and Cedric Messiant. Investigating the cross-linguistic potential of VerbNet -style classification<br />
  95. Sebastian Spiegler and Christian Monson. EMMA: A novel Evaluation Metric for Morphological Analysis<br />
  96. Naoki Yoshinaga and Masaru Kitsuregawa. Kernel Slicing: Scalable Online Training with Conjunctive Features<br />
  97. Xiaohua LIU, Kuan LI, Bo HAN, Ming ZHOU and Long JIANG. Semantic Role Labeling for News Tweets<br />
  98. Hector Llorens, Estela Saquete and Borja Navarro. TimeML Events Recognition and Classification: Learning CRF Models with Semantic Roles<br />
  99. Dmitry Davidov and Ari Rappoport. Automated Translation of Semantic Relationships<br />
 100. Bernd Bohnet, Leo Wanner, Simon Mill and Alicia Burga. Broad Coverage Multilingual Deep Sentence Generation with a Stochastic Multi-Level Realizer<br />
 101. Smruthi Mukund, Debanjan Ghosh and Rohini Srihari. Using Cross-Lingual Projections to Generate Semantic Role Labeled Annotated Corpus for Urdu &#8211; A Resource Poor Language<br />
 102. Michael Roth and Anette Frank. EM-based Alignment of Routes and Route Directions for Natural Language Generation<br />
 103. Lilja Øvrelid, Erik Velldal and Stephan Oepen. Syntactic Scope Resolution in Uncertainty Analysis<br />
 104. Vahed Qazvinian and Dragomir R. Radev. Citation Summarization Through Keyphrase Extraction<br />
 105. Jianfeng Gao, Xiaolong Li, Daniel Micol and Chris Quirk. A Large Scale Ranker-Based System A large scale ranker-bsaed system for search query spelling correction<br />
 106. Fabio Massimo Zanzotto, Ioannis Korkontzelos, Francesca Fallucchi and Suresh Manandhar. Estimating Linear Models for Compositional Distributional Semantics<br />
 107. Daniel Andrade, Tetsuya Nasukawa and Junichi Tsujii. Robust Measurement and Comparison of Context Similarity for Finding Translation Pairs<br />
 108. Markus Dickinson. Generating Learner-Like Morphological Errors in Russian<br />
 109. Alberto Barrón-Cede?o, Paolo Rosso, Eneko Agirre and Gorka Labaka. Plagiarism Detection across Distant Language Pairs<br />
 110. ThuyLinh Nguyen, Stephan Vogel and Noah A. Smith. Nonparametric Word Segmentation for Machine Translation<br />
 111. Claire Gardent and Laura Perez-Beltrachini. Efficient RTG based surface realisation for TAG<br />
 112. Rohit Kate, Xiaoqiang Luo, Siddharth Patwardhan, Martin Franz, Radu Florian, Raymond Mooney, Salim Roukos and Chris Welty. Learning to Predict Readability using Diverse Linguistic Features<br />
 113. Tong Wang and Graeme Hirst. Near-synonym Lexical Choice in Latent Semantic Space<br />
 114. Xiaowen Ding and Bing Liu. Resolving Object and Attribute Coreference in Opinion Mining<br />
 115. Ines Rehbein, Josef Ruppenhofer and Alexis Palmer. Bringing Active Learning to Life<br />
 116. Shachar Mirkin, Jonathan Berant, Ido Dagan and Eyal Shnarch. Recognising Entailment within Discourse<br />
 117. Alpa Jain and Patrick Pantel. FactRank: Random Walks on a Web of Facts<br />
 118. Petr Knoth, Jakub Novotny and Zdenek Zdrahal. Automatic generation of inter-passage links based on textual analysis of content<br />
 119. Andre Blessing and Hinrich Schütze. Self-Annotation for fine-grained geospatial relation extraction<br />
 120. Bart Cramer and Yi Zhang. Constraining robust constructions for broad-coverage parsing with precision grammars<br />
 121. Alpa Jain and Marco Pennacchiotti. Open Entity Extraction fromWeb Search Query Logs<br />
 122. Simon Zwarts, Mark Johnson and Robert Dale. Detecting Speech Repairs Incrementally Using a Noisy Channel Approach<br />
 123. Shuming Shi, Huibin Zhang, Xiaojie Yuan and Ji-Rong Wen. Corpus-based Semantic Class Mining: Distributional vs. Pattern-Based Approaches<br />
 124. Mark Johnson and Katherine Demuth. Unsupervised phonemic Chinese word segmentation using Adaptor Grammars<br />
 125. Sujith Ravi, Ashish Vaswani, Kevin Knight and David Chiang. Fast, Greedy Model Minimization for Unsupervised Tagging<br />
 126. Sanae Fujita and Masaaki Nagata. Enriching Dictionaries with Images from the Internet &#8211; Targeting Wikipedia and a Japanese Semantic Lexicon: Lexeed -<br />
 127. Dmitriy Genzel. Automatically Learning Source-side Reordering Rules for Large Scale Machine Translation<br />
 128. Bin Chen, Jian Su and Chew Lim Tan. A Twin-Candidate Based Approach for Event Pronoun Resolution using Composite Kernel<br />
 129. Yao Yao and Feng-hsi Liu. A Working Report on Statistically Modeling Dative Variation in Mandarin Chinese<br />
 130. Emily Pitler, Shane Bergsma, Dekang Lin and Kenneth Church. Using Web-scale N-grams to Improve Base NP Parsing Performance<br />
 131. Derya Ozkan, Kenji Sagae and Louis-Philippe Morency. Latent Mixture of Discriminative Experts for Multimodal Prediction Modeling<br />
 132. Carmen Banea, Rada Mihalcea and Janyce Wiebe. Multilingual Subjectivity: Are More Languages Better?<br />
 133. Tom Lippincott, Diarmuid ó Séaghdha, Lin Sun and Anna Korhonen. Exploring variation across biomedical subdomains<br />
 134. Jie Cai and Michael Strube. End-to-End Coreference Resolution via Hypergraph Partitioning<br />
 135. Pascal Denis and Philippe Muller. Comparison of different algebras for inducing the temporal structure of texts<br />
 136. Yang Wang and Kathleen McKeown. “Got You!”: Automatic Vandalism Detection in Wikipedia with Web-based Syntactic-Semantic Modeling<br />
 137. Katsuhiko Hayashi, Hajime Tsukada, Katsuhito Sudoh, Kevin Duh and Seiichi Yamamoto. Hierarchical Phrase-based Machine Translation with Word-based Reordering Model<br />
 138. Razvan Bunescu and Yunfeng Huang. A Utility-Driven Approach to Question Ranking<br />
 139. Jakob Uszkoreit, Jay Ponte, Ashok Popat and Moshe Dubiner. Large Scale Parallel Document Mining for Machine Translation<br />
 140. Xiance Si and Maosong Sun. Explore the Structure of Social Tags by Subsumption Relations<br />
 141. Mitesh Khapra, Saurabh Sohoney, Anup Kulkarni and Pushpak Bhattacharyya. Value for Money: Balancing Annotation Effort, Lexicon Building and Accuracy for Multilingual WSD<br />
 142. Mei Yang and Katrin Kirchhoff. Contextual Modeling for Meeting Translation Using Unsupervised Word Sense Disambiguation<br />
 143. Yee Seng Chan and Dan Roth. Exploiting Background Knowledge for Relation Extraction<br />
 144. Jong-Hoon Oh, Ichiro Yamada, Kentaro Torisawa and De Saeger Stijn. Co-STAR: A Co-training Style Algorithm for Hyponymy Relation Acquisition from Structured and Unstructured Text<br />
 145. Yuncong Chen and Pascale Fung. Unsupervised Synthesis of Multilingual Wikipedia Articles<br />
 146. Xiaofeng YU and Wai LAM. Jointly Identifying Entities and Extracting Relations in Encyclopedia Text via A Graphical Model Approach<br />
 147. Ryan Georgi, Fei Xia and Will Lewis. Comparing Language Similarity Across Genetic and Typologically-Based Groupings<br />
 148. Julia Hockenmaier and Yonatan Bisk. Normal-form parsing for Combinatory Categorial Grammars with generalized composition and type-raising<br />
 149. Lizhen Qu, Georgiana Ifrim and Gerhard Weikum. The Bag-of-Opinions Method for Review Rating Prediction from Sparse Text Patterns<br />
 150. Yanqing He and Yu Zhou. A Novel Reordering Model Based on Multi-layer Phrase for Statistical Machine Translation<br />
 151. Jeff Pasternack and Dan Roth. Knowing what to Believe (when you already know something)<br />
 152. Wei Zhang, Jian Su and Chew Lim Tan. Entity Linking Leveraging Automatically Generated Annotation<br />
 153. Yajuan Duan, Long Jiang, Tao Qin, Ming Zhou and Harry Shum. An Empirical Study on Learning to Rank of Tweets<br />
 154. Shanheng Zhao and Hwee Tou Ng. Maximum Metric Score Training for Coreference Resolution<br />
 155. Sheng Guo and Naren Ramakrishnan. Finding the Storyteller: Automatic Spoiler Tagging using Linguistic Cues<br />
 156. Altaf Rahman and Vincent Ng. Fine-Grained Semantic Class Induction via Hierarchical and Collective Classification<br />
 157. Yao-zhong Zhang, Takuya Matsuzaki and Jun&#8217;ichi Tsujii. Forest-guided Supertagger Training</p>
<p>注：转载请注明出处“<a href="http://www.52nlp.cn">我爱自然语言处理</a>”：<a href="http://www.52nlp.cn">www.52nlp.cn</a></p>
<p>本文链接地址：<a href="http://www.52nlp.cn/coling-2010-list-of-accepted-papers-oral">http://www.52nlp.cn/coling-2010-list-of-accepted-papers-oral</a></p>
<p>
<!-- Begin Google Adsense code -->
<script type="text/javascript"><!--
google_ad_client = "pub-4332174469367599";
/* 336x280, 创建于 09-2-7 */
google_ad_slot = "5707022987";
google_ad_width = 336;
google_ad_height = 280;
//-->
</script>
<script type="text/javascript"
src="http://pagead2.googlesyndication.com/pagead/show_ads.js">
</script>
<!-- End Google Adsense code -->
</p>


<p>相关文章:<ol><li><a href='http://www.52nlp.cn/acl-2010-list-of-accepted-papers' rel='bookmark' title='Permanent Link: ACL 2010: List of Accepted Papers'>ACL 2010: List of Accepted Papers</a></li>
<li><a href='http://www.52nlp.cn/acl-2010-paper-%e5%9b%bd%e5%86%85%e7%a0%94%e7%a9%b6%e5%8d%95%e4%bd%8d%e5%bd%95%e7%94%a8%e6%83%85%e5%86%b5' rel='bookmark' title='Permanent Link: ACL 2010 Paper国内研究单位录用情况'>ACL 2010 Paper国内研究单位录用情况</a></li>
<li><a href='http://www.52nlp.cn/coling-2010-prospect' rel='bookmark' title='Permanent Link: COLING 2010前瞻——规则与统计共舞，语言随计算齐飞'>COLING 2010前瞻——规则与统计共舞，语言随计算齐飞</a></li>
<li><a href='http://www.52nlp.cn/acl-ijcnlp-2009-running-two' rel='bookmark' title='Permanent Link: ACL-IJCNLP 2009会议进行时二'>ACL-IJCNLP 2009会议进行时二</a></li>
<li><a href='http://www.52nlp.cn/acl09-full-paper-accepted-details' rel='bookmark' title='Permanent Link: ACL09 Full Paper录用情况'>ACL09 Full Paper录用情况</a></li>
<li><a href='http://www.52nlp.cn/acl-ijcnlp-2009-running-one' rel='bookmark' title='Permanent Link: ACL-IJCNLP 2009会议进行时一'>ACL-IJCNLP 2009会议进行时一</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-and-computational-linguistics-common-abbreviations-acronyms' rel='bookmark' title='Permanent Link: 自然语言处理及计算语言学常见缩略语'>自然语言处理及计算语言学常见缩略语</a></li>
<li><a href='http://www.52nlp.cn/acl-2010-best-paper-awards' rel='bookmark' title='Permanent Link: ACL 2010 Best Paper Awards'>ACL 2010 Best Paper Awards</a></li>
<li><a href='http://www.52nlp.cn/acl09-acceptance-rates-by-areas' rel='bookmark' title='Permanent Link: ACL09 Full Paper各研究领域的录用情况'>ACL09 Full Paper各研究领域的录用情况</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-and-machine-translation-faq' rel='bookmark' title='Permanent Link: 自然语言处理与机器翻译FAQ'>自然语言处理与机器翻译FAQ</a></li>
</ol></p><img src="http://feeds.feedburner.com/~r/52nlp/~4/mCHtS9xfDHk" height="1" width="1"/>]]></content:encoded>
			<wfw:commentRss>http://www.52nlp.cn/coling-2010-list-of-accepted-papers-oral/feed</wfw:commentRss>
		<slash:comments>9</slash:comments>
		<feedburner:origLink>http://www.52nlp.cn/coling-2010-list-of-accepted-papers-oral</feedburner:origLink></item>
		<item>
		<title>条件随机场文献阅读指南</title>
		<link>http://feedproxy.google.com/~r/52nlp/~3/O7kN40IUais/%e6%9d%a1%e4%bb%b6%e9%9a%8f%e6%9c%ba%e5%9c%ba%e6%96%87%e7%8c%ae%e9%98%85%e8%af%bb%e6%8c%87%e5%8d%97</link>
		<comments>http://www.52nlp.cn/%e6%9d%a1%e4%bb%b6%e9%9a%8f%e6%9c%ba%e5%9c%ba%e6%96%87%e7%8c%ae%e9%98%85%e8%af%bb%e6%8c%87%e5%8d%97#comments</comments>
		<pubDate>Mon, 24 May 2010 15:49:02 +0000</pubDate>
		<dc:creator>52nlp</dc:creator>
				<category><![CDATA[机器学习]]></category>
		<category><![CDATA[条件随机场]]></category>
		<category><![CDATA[自然语言处理]]></category>
		<category><![CDATA[Brown90]]></category>
		<category><![CDATA[CRF]]></category>
		<category><![CDATA[Hanna Wallach]]></category>
		<category><![CDATA[John D. Lafferty]]></category>
		<category><![CDATA[文献]]></category>
		<category><![CDATA[最大熵模型]]></category>

		<guid isPermaLink="false">http://www.52nlp.cn/?p=3378</guid>
		<description><![CDATA[　　与最大熵模型相似，条件随机场（Conditional random fields，CRFs）是一种机器学习模型，在自然语言处理的许多领域（如词性标注、中文分词、命名实体识别等）都有比较好的应用效果。条件随机场最早由John D. Lafferty提出，其也是Brown90的作者之一，和贾里尼克相似，在离开IBM后他去了卡耐基梅隆大学继续搞学术研究，2001年以第一作者的身份发表了CRF的经典论文 “Conditional random fields: Probabilistic models for segmenting and labeling sequence data”。
　　关于条件随机场的参考文献及其他资料，Hanna Wallach在05年整理和维护的这个页面“conditional random fields”非常不错，其中涵盖了自01年CRF提出以来的很多经典论文（不过似乎只到05年，之后并未更新）以及几个相关的工具包(不过也没有包括CRF++），但是仍然非常值得入门条件随机场的读者参考，以下摘选自该网页。
introduction
Conditional random fields (CRFs) are a probabilistic framework for labeling and segmenting structured data, such as sequences, trees and lattices. The underlying idea is that of defining a conditional probability distribution over label sequences given a particular [...]


相关文章:<ol><li><a href='http://www.52nlp.cn/natural-language-processing-and-computational-linguistics-common-abbreviations-acronyms' rel='bookmark' title='Permanent Link: 自然语言处理及计算语言学常见缩略语'>自然语言处理及计算语言学常见缩略语</a></li>
<li><a href='http://www.52nlp.cn/maximum-entropy-model-tutorial-reading' rel='bookmark' title='Permanent Link: 最大熵模型文献阅读指南'>最大熵模型文献阅读指南</a></li>
<li><a href='http://www.52nlp.cn/most-influential-nlp-papers' rel='bookmark' title='Permanent Link: 最有影响力的自然语言处理论文'>最有影响力的自然语言处理论文</a></li>
<li><a href='http://www.52nlp.cn/coling-2010-prospect' rel='bookmark' title='Permanent Link: COLING 2010前瞻——规则与统计共舞，语言随计算齐飞'>COLING 2010前瞻——规则与统计共舞，语言随计算齐飞</a></li>
<li><a href='http://www.52nlp.cn/acl-ijcnlp-2009-running-one' rel='bookmark' title='Permanent Link: ACL-IJCNLP 2009会议进行时一'>ACL-IJCNLP 2009会议进行时一</a></li>
<li><a href='http://www.52nlp.cn/bayesian-modeling-for-language-tutorial-reading' rel='bookmark' title='Permanent Link: 贝叶斯模型文献阅读指南'>贝叶斯模型文献阅读指南</a></li>
<li><a href='http://www.52nlp.cn/%e4%b8%ad%e6%96%87%e5%88%86%e8%af%8d%e5%85%a5%e9%97%a8%e4%b9%8b%e6%96%87%e7%8c%ae' rel='bookmark' title='Permanent Link: 中文分词入门之文献'>中文分词入门之文献</a></li>
<li><a href='http://www.52nlp.cn/acl-ijcnlp-2009-running-two' rel='bookmark' title='Permanent Link: ACL-IJCNLP 2009会议进行时二'>ACL-IJCNLP 2009会议进行时二</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-and-computational-linguistics-books-summary-one-foreign-book' rel='bookmark' title='Permanent Link: 自然语言处理与计算语言学书籍汇总之一：国外书籍'>自然语言处理与计算语言学书籍汇总之一：国外书籍</a></li>
<li><a href='http://www.52nlp.cn/strong-author-team-of-smt-classic-brown90' rel='bookmark' title='Permanent Link: SMT经典再回首之Brown90:强大的作者阵容'>SMT经典再回首之Brown90:强大的作者阵容</a></li>
</ol>]]></description>
			<content:encoded><![CDATA[<p>　　与最大熵模型相似，条件随机场（Conditional random fields，CRFs）是一种机器学习模型，在自然语言处理的许多领域（如词性标注、中文分词、命名实体识别等）都有比较好的应用效果。条件随机场最早由John D. Lafferty提出，其也是<a href="http://www.52nlp.cn/strong-author-team-of-smt-classic-brown90">Brown90</a>的作者之一，和贾里尼克相似，在离开IBM后他去了卡耐基梅隆大学继续搞学术研究，2001年以第一作者的身份发表了CRF的经典论文 “Conditional random fields: Probabilistic models for segmenting and labeling sequence data”。<span id="more-3378"></span><br />
　　关于条件随机场的参考文献及其他资料，Hanna Wallach在05年整理和维护的这个页面“<a href="http://www.inference.phy.cam.ac.uk/hmw26/crf/">conditional random fields</a>”非常不错，其中涵盖了自01年CRF提出以来的很多经典论文（不过似乎只到05年，之后并未更新）以及几个相关的工具包(不过也没有包括CRF++），但是仍然非常值得入门条件随机场的读者参考，以下摘选自该网页。</p>
<h1><a name="introduction">introduction</a></h1>
<p>Conditional random fields (CRFs) are a probabilistic framework for labeling and segmenting structured data, such as sequences, trees and lattices. The underlying idea is that of defining a conditional probability distribution over label sequences given a particular observation sequence, rather than a joint distribution over both label and observation sequences. The primary advantage of CRFs over hidden Markov models is their conditional nature, resulting in the relaxation of the independence assumptions required by HMMs in order to ensure tractable inference. Additionally, CRFs avoid the label bias problem, a weakness exhibited by maximum entropy Markov models (MEMMs) and other conditional Markov models based on directed graphical models. CRFs outperform both MEMMs and HMMs on a number of real-world tasks in many fields, including bioinformatics, computational linguistics and speech recognition.</p>
<h1><a name="tutorial">tutorial</a></h1>
<p>Hanna M. Wallach. <a href="http://www.inference.phy.cam.ac.uk/hmw26/papers/crf_intro.pdf">Conditional Random  Fields: An Introduction.</a> Technical Report MS-CIS-04-21. Department of Computer and Information Science, University of Pennsylvania, 2004.</p>
<h1><a name="papers">papers by year</a></h1>
<h2><a name="2001">2001</a></h2>
<p>John Lafferty, Andrew McCallum, Fernando Pereira. <a href="http://www.cs.umass.edu/%7Emccallum/papers/crf-icml01.ps.gz">Conditional Random  Fields: Probabilistic Models for Segmenting and Labeling Sequence Data.</a> In <em>Proceedings of the Eighteenth International Conference on Machine Learning</em> (ICML-2001), 2001.</p>
<h2><a name="2002">2002</a></h2>
<p>Hanna Wallach. <a href="http://www.cogsci.ed.ac.uk/%7Eosborne/msc-projects/wallach.ps.gz">Efficient Training  of Conditional Random Fields.</a> M.Sc. thesis, Division of Informatics, University of Edinburgh, 2002.</p>
<p>Thomas G. Dietterich. <a href="http://eecs.oregonstate.edu/%7Etgd/publications/mlsd-ssspr.pdf">Machine Learning  for Sequential Data: A Review.</a> In <em>Structural, Syntactic, and Statistical Pattern Recognition; Lecture Notes in Computer Science, Vol. 2396</em>, T. Caelli (Ed.), pp. 15–30, Springer-Verlag, 2002.</p>
<h2><a name="2003">2003</a></h2>
<p>Fei Sha and Fernando Pereira. <a href="http://www.cis.upenn.edu/%7Efeisha/pubs/shallow03.pdf">Shallow Parsing with Conditional Random Fields.</a> In <em>Proceedings of the 2003 Human Language Technology Conference and North American Chapter of the Association for Computational Linguistics</em> (HLT/NAACL-03), 2003.</p>
<p>Andrew McCallum. <a href="http://www.cs.umass.edu/%7Emccallum/papers/ifcrf-uai2003.pdf">Efficiently Inducing  Features of Conditional Random Fields.</a> In <em>Proceedings of the 19th Conference in Uncertainty in Articifical Intelligence</em> (UAI-2003), 2003.</p>
<p>David Pinto, Andrew McCallum, Xing Wei and W. Bruce Croft. <a href="http://www.cs.umass.edu/%7Emccallum/papers/crftable-sigir2003.pdf">Table Extraction  Using Conditional Random Fields.</a> In <em>Proceedings of the 26th Annual International ACM SIGIR Conference on Research and Development in Information Retrieval</em> (SIGIR 2003), 2003.</p>
<p>Andrew McCallum and Wei Li. <a href="http://cnts.uia.ac.be/conll2003/pdf/18891mcc.pdf">Early Results for Named Entity Recognition with Conditional Random Fields, Feature Induction and Web-Enhanced Lexicons.</a> In <em>Proceedings of the Seventh Conference on Natural Language Learning</em> (CoNLL), 2003.</p>
<p>Wei Li and Andrew McCallum. <a href="http://www.cs.umass.edu/%7Emccallum/papers/hindi-talip2003.pdf">Rapid Development  of Hindi Named Entity Recognition Using Conditional Random Fields and Feature Induction.</a> In <em>ACM Transactions on Asian Language Information Processing</em> (TALIP), 2003.</p>
<p>Yasemin Altun and Thomas Hofmann. <a href="http://www.cs.brown.edu/people/altun/pubs/AltunHofmann-EuroSpeech2003.pdf">Large Margin  Methods for Label Sequence Learning.</a> In <em>Proceedings of 8th European Conference on Speech Communication and Technology</em> (EuroSpeech), 2003.</p>
<p>Simon Lacoste-Julien. <a href="http://www.cs.berkeley.edu/%7Eslacoste/school/cs281a/project/M3netReportpdf.pdf">Combining SVM  with graphical models for supervised classification: an introduction to Max-Margin Markov Networks</a>. CS281A Project Report, UC Berkeley, 2003.</p>
<blockquote></blockquote>
<h2><a name="2004">2004</a></h2>
<p>Andrew McCallum, Khashayar Rohanimanesh and Charles Sutton. <a href="http://www.cs.umass.edu/%7Emccallum/papers/dcrf-nips03.pdf">Dynamic Conditional  Random Fields for Jointly Labeling Multiple Sequences.</a> Workshop on Syntax, Semantics, Statistics; 16th Annual Conference on Neural Information Processing Systems (NIPS 2003), 2004.</p>
<p>Kevin Murphy, Antonio Torralba and William T.F. Freeman. <a href="http://web.mit.edu/torralba/www/nips2003.pdf">Using the forest to see the trees: a graphical model relating features, objects and scenes.</a> In <em>Advances in Neural Information Processing Systems 16</em> (NIPS 2003), 2004.</p>
<blockquote></blockquote>
<p>Sanjiv Kumar and Martial Hebert. <a href="http://www-2.cs.cmu.edu/%7Eskumar/DRF/modDRF.pdf">Discriminative Fields for Modeling Spatial Dependencies in Natural Images.</a> In <em>Advances in Neural Information Processing Systems 16</em> (NIPS 2003), 2004.</p>
<p>Ben Taskar, Carlos Guestrin and Daphne Koller. <a href="http://books.nips.cc/papers/files/nips16/NIPS2003_AA04.pdf">Max-Margin Markov  Networks.</a> In <em>Advances in Neural Information Processing Systems 16</em> (NIPS 2003), 2004.</p>
<blockquote></blockquote>
<p>Burr Settles. <a href="http://www.cs.wisc.edu/%7Ebsettles/pub/bsettles-nlpba04.pdf">Biomedical Named  Entity Recognition Using Conditional Random Fields and Rich Feature Sets.</a> To appear in <em>Proceedings of the International Joint Workshop on Natural Language Processing in Biomedicine and its Applications</em> (NLPBA), 2004.</p>
<p>A demo of the system can be downloaded <a href="http://www.cs.wisc.edu/%7Ebsettles/abner/">here</a>.</p>
<p>Charles Sutton, Khashayar Rohanimanesh and Andrew McCallum. <a href="http://www.aicml.cs.ualberta.ca/banff04/icml/pages/papers/308.pdf">Dynamic Conditional  Random Fields: Factorized Probabilistic Models for Labeling and Segmenting Sequence Data.</a> In <em>Proceedings of the Twenty-First International Conference on Machine Learning</em> (ICML 2004), 2004.</p>
<p>John Lafferty, Xiaojin Zhu and Yan Liu. <a href="http://portal.acm.org/citation.cfm?id=1015330.1015337">Kernel conditional random fields: representation and clique selection.</a> In <em>Proceedings of the Twenty-First International Conference on Machine Learning</em> (ICML 2004), 2004.</p>
<p>Xuming He, Richard Zemel, and Miguel Á. Carreira-Perpiñán. <a href="http://www.cs.toronto.edu/pub/zemel/Papers/cvpr04.pdf">Multiscale conditional random fields for image labelling.</a> In <em>Proceedings of the 2004 IEEE Computer Society Conference on Computer Vision and Pattern Recognition</em> (CVPR 2004), 2004.</p>
<p>Yasemin Altun, Alex J. Smola, Thomas Hofmann. <a href="http://www.cs.brown.edu/%7Eth/papers/AltSmoHof-UAI2004.pdf">Exponential Families  for Conditional Random Fields.</a> In <em>Proceedings of the 20th Conference on Uncertainty in Artificial Intelligence</em> (UAI-2004), 2004.</p>
<p>Michelle L. Gregory and Yasemin Altun. <a href="http://www.cs.brown.edu/people/altun/pubs/GregoryAltun.pdf">Using Conditional Random Fields to Predict Pitch Accents in Conversational Speech.</a> In <em>Proceedings of the 42<sup>nd</sup> Annual Meeting of the Association for Computational Linguistics</em> (ACL 2004), 2004.</p>
<p>Brian Roark, Murat Saraclar, Michael Collins and Mark Johnson. <a href="http://www.cslu.ogi.edu/people/roark/ACL04CRFLM.pdf">Discriminative Language  Modeling with Conditional Random Fields and the Perceptron Algorithm.</a> In <em>Proceedings of the 42<sup>nd</sup> Annual Meeting of the Association for Computational Linguistics</em> (ACL 2004), 2004.</p>
<p>Ryan McDonald and Fernando Pereira. <a href="http://www.pdg.cnb.uam.es/BioLINK/workshop_BioCreative_04/handout/pdf/task1A.pdf">Identifying Gene  and Protein Mentions in Text Using Conditional Random Fields.</a> BioCreative, 2004.</p>
<p>Trausti T. Kristjansson, Aron Culotta, Paul Viola and Andrew McCallum.  <a href="http://http//www.cs.umass.edu/%7Emccallum/papers/addrie-aaai04.pdf">Interactive Information  Extraction with Constrained Conditional Random Fields.</a> In <em>Proceedings of the Nineteenth National Conference on Artificial Intelligence</em> (AAAI 2004), 2004.</p>
<p>Thomas G. Dietterich, Adam Ashenfelter and Yaroslav Bulatov. <a href="http://web.engr.oregonstate.edu/%7Etgd/publications/ml2004-treecrf.pdf">Training Conditional  Random Fields via Gradient Tree Boosting.</a> In <em>Proceedings of the Twenty-First International Conference on Machine Learning</em> (ICML 2004), 2004.</p>
<blockquote></blockquote>
<p>John Lafferty, Yan Liu and Xiaojin Zhu. <a href="http://www.aladdin.cs.cmu.edu/papers/pdfs/y2004/kernecon.pdf">Kernel Conditional  Random Fields: Representation, Clique Selection, and Semi-Supervised Learning.</a> Technical Report CMU-CS-04-115, Carnegie Mellon University, 2004.</p>
<p>Fuchun Peng and Andrew McCallum (2004). <a href="http://acl.ldc.upenn.edu/hlt-naacl2004/main/pdf/176_Paper.pdf">Accurate Information  Extraction from Research Papers using Conditional Random Fields.</a> In <em>Proceedings of Human Language Technology Conference and North American Chapter of the Association for Computational Linguistics</em> (HLT/NAACL-04), 2004.</p>
<p>Yasemin Altun, Thomas Hofmann and Alexander J. Smola. <a href="http://www.cs.brown.edu/%7Eth/papers/AltHofSmo-ICML2004.pdf">Gaussian process  classification for segmenting and annotating sequences.</a> In <em>Proceedings of the Twenty-First International Conference on Machine Learning</em> (ICML 2004), 2004.</p>
<p>Yasemin Altun and Thomas Hofmann. <a href="http://www.cs.brown.edu/people/altun/pubs/CS-03-23.ps">Gaussian Process Classification for Segmenting and Annotating Sequences.</a> Technical Report CS-04-12, Department of Computer Science, Brown University, 2004.</p>
<h2><a name="2005">2005</a></h2>
<p>Cristian Smimchisescu, Atul Kanaujia, Zhiguo Li and Dimitris Metaxus. <a href="http://www.cs.toronto.edu/%7Ecrismin/PAPERS/iccv05.pdf">Conditional Models  for Contextual Human Motion Recognition.</a> In <em>Proceedings of the International Conference on Computer Vision</em>, (ICCV 2005), Beijing, China, 2005.</p>
<p>Ariadna Quattoni, Michael Collins and Trevor Darrel. <a href="http://books.nips.cc/papers/files/nips17/NIPS2004_0810.pdf"> Conditional Random Fields for Object Recognition.</a> In <em>Advances in Neural Information Processing Systems 17</em> (NIPS 2004), 2005.</p>
<p>Jospeh Bockhorst and Mark Craven. <a href="http://books.nips.cc/papers/files/nips17/2004_0745.pdf"> Markov Networks for Detecting Overlapping Elements in Sequence Data.</a> In <em>Advances in Neural Information Processing Systems 17</em> (NIPS 2004), 2005.</p>
<p>Antonio Torralba, Kevin P. Murphy, William T. Freeman. <a href="http://www.ai.mit.edu/%7Emurphyk/Papers/BRFaimemo.pdf">Contextual models for object detection using boosted random fields.</a> In <em>Advances in Neural Information Processing Systems 17</em> (NIPS 2004), 2005.</p>
<p>Sunita Sarawagi and William W. Cohen. <a href="http://www-2.cs.cmu.edu/%7Ewcohen/postscript/semiCRF.pdf">Semi-Markov Conditional  Random Fields for Information Extraction.</a> In <em>Advances in Neural Information Processing Systems 17</em> (NIPS 2004), 2005.</p>
<blockquote></blockquote>
<p>Yuan Qi, Martin Szummer and Thomas P. Minka. <a href="http://people.csail.mit.edu/u/a/alanqi/public_html/papers/Qi-Bayesian-CRF-AIstat05.pdf">Bayesian Conditional  Random Fields.</a> To appear in <cite>Proceedings of the Tenth International Workshop on Artificial Intelligence and Statistics</cite> (AISTATS 2005), 2005.</p>
<p>Aron Culotta, David Kulp and Andrew McCallum. <a href="http://www.cs.umass.edu/%7Eculotta/pubs/crfgene.pdf">Gene Prediction with Conditional Random Fields.</a> Technical Report UM-CS-2005-028. University of Massachusetts, Amherst, 2005.</p>
<p>Yang Wang and Qiang Ji. <a href="http://www.geocities.com/wang_yang_mr/publication/DCRFcvpr05.pdf">A Dynamic Conditional Random Field Model for Object Segmentation in Image Sequences.</a> In <cite>IEEE Computer Society Conference on Computer Vision and Pattern Recognition</cite> (CVPR 2005), Volume 1, 2005.</p>
<h1><a name="software">software</a></h1>
<p><a href="http://mallet.cs.umass.edu/">MALLET</a>: A Machine Learning for Language Toolkit.</p>
<blockquote><p>MALLET is an integrated collection of Java code useful for statistical natural language processing, document classification, clustering, information extraction, and other machine learning applications to text.</p></blockquote>
<p><a href="http://www.cs.wisc.edu/%7Ebsettles/abner/">ABNER</a>: A Biomedical Named Entity Recognizer.</p>
<blockquote><p>ABNER is a text analysis tool for molecular biology. It is essentially an interactive, user-friendly interface to a system designed as part of the NLPBA/BioNLP 2004 Shared Task challenge.</p></blockquote>
<p><a href="http://minorthird.sourceforge.net/">MinorThird</a>.</p>
<blockquote><p>MinorThird is a collection of Java classes for storing text, annotating text, and learning to extract entities and categorize text.</p></blockquote>
<p><a href="http://www.cs.ubc.ca/%7Emurphyk/Software/CRF/crf.html">Kevin  Murphy&#8217;s MATLAB CRF code</a>.</p>
<blockquote><p>Conditional random fields (chains, trees and general graphs; includes BP code).</p></blockquote>
<p><a href="http://crf.sourceforge.net/">Sunita Sarawagi&#8217;s CRF package</a>.</p>
<blockquote><p>The CRF package is a Java implementation of conditional random fields  for sequential labeling.</p></blockquote>
<p>　　最后推荐<a href="http://crfpp.sourceforge.net/">CRF++:Yet Another CRF toolkit</a>，如果读者对于基于字标注的中文分词感兴趣，可以很快的利用该工具包构造一个基于条件随机场的中文分词工具，而且性能也不赖。</p>
<p>注：转载请注明出处“<a href="http://www.52nlp.cn">我爱自然语言处理</a>”：<a href="http://www.52nlp.cn">www.52nlp.cn</a></p>
<p>本文链接地址：<a href="http://www.52nlp.cn/条件随机场文献阅读指南">http://www.52nlp.cn/条件随机场文献阅读指南</a></p>
<p>
<!-- Begin Google Adsense code -->
<script type="text/javascript"><!--
google_ad_client = "pub-4332174469367599";
/* 336x280, 创建于 09-2-7 */
google_ad_slot = "5707022987";
google_ad_width = 336;
google_ad_height = 280;
//-->
</script>
<script type="text/javascript"
src="http://pagead2.googlesyndication.com/pagead/show_ads.js">
</script>
<!-- End Google Adsense code -->
</p>


<p>相关文章:<ol><li><a href='http://www.52nlp.cn/natural-language-processing-and-computational-linguistics-common-abbreviations-acronyms' rel='bookmark' title='Permanent Link: 自然语言处理及计算语言学常见缩略语'>自然语言处理及计算语言学常见缩略语</a></li>
<li><a href='http://www.52nlp.cn/maximum-entropy-model-tutorial-reading' rel='bookmark' title='Permanent Link: 最大熵模型文献阅读指南'>最大熵模型文献阅读指南</a></li>
<li><a href='http://www.52nlp.cn/most-influential-nlp-papers' rel='bookmark' title='Permanent Link: 最有影响力的自然语言处理论文'>最有影响力的自然语言处理论文</a></li>
<li><a href='http://www.52nlp.cn/coling-2010-prospect' rel='bookmark' title='Permanent Link: COLING 2010前瞻——规则与统计共舞，语言随计算齐飞'>COLING 2010前瞻——规则与统计共舞，语言随计算齐飞</a></li>
<li><a href='http://www.52nlp.cn/acl-ijcnlp-2009-running-one' rel='bookmark' title='Permanent Link: ACL-IJCNLP 2009会议进行时一'>ACL-IJCNLP 2009会议进行时一</a></li>
<li><a href='http://www.52nlp.cn/bayesian-modeling-for-language-tutorial-reading' rel='bookmark' title='Permanent Link: 贝叶斯模型文献阅读指南'>贝叶斯模型文献阅读指南</a></li>
<li><a href='http://www.52nlp.cn/%e4%b8%ad%e6%96%87%e5%88%86%e8%af%8d%e5%85%a5%e9%97%a8%e4%b9%8b%e6%96%87%e7%8c%ae' rel='bookmark' title='Permanent Link: 中文分词入门之文献'>中文分词入门之文献</a></li>
<li><a href='http://www.52nlp.cn/acl-ijcnlp-2009-running-two' rel='bookmark' title='Permanent Link: ACL-IJCNLP 2009会议进行时二'>ACL-IJCNLP 2009会议进行时二</a></li>
<li><a href='http://www.52nlp.cn/natural-language-processing-and-computational-linguistics-books-summary-one-foreign-book' rel='bookmark' title='Permanent Link: 自然语言处理与计算语言学书籍汇总之一：国外书籍'>自然语言处理与计算语言学书籍汇总之一：国外书籍</a></li>
<li><a href='http://www.52nlp.cn/strong-author-team-of-smt-classic-brown90' rel='bookmark' title='Permanent Link: SMT经典再回首之Brown90:强大的作者阵容'>SMT经典再回首之Brown90:强大的作者阵容</a></li>
</ol></p><img src="http://feeds.feedburner.com/~r/52nlp/~4/O7kN40IUais" height="1" width="1"/>]]></content:encoded>
			<wfw:commentRss>http://www.52nlp.cn/%e6%9d%a1%e4%bb%b6%e9%9a%8f%e6%9c%ba%e5%9c%ba%e6%96%87%e7%8c%ae%e9%98%85%e8%af%bb%e6%8c%87%e5%8d%97/feed</wfw:commentRss>
		<slash:comments>4</slash:comments>
		<feedburner:origLink>http://www.52nlp.cn/%e6%9d%a1%e4%bb%b6%e9%9a%8f%e6%9c%ba%e5%9c%ba%e6%96%87%e7%8c%ae%e9%98%85%e8%af%bb%e6%8c%87%e5%8d%97</feedburner:origLink></item>
		<item>
		<title>足球依然是圆的！</title>
		<link>http://feedproxy.google.com/~r/52nlp/~3/kX0ZzHoGi7A/%e8%b6%b3%e7%90%83%e4%be%9d%e7%84%b6%e6%98%af%e5%9c%86%e7%9a%84</link>
		<comments>http://www.52nlp.cn/%e8%b6%b3%e7%90%83%e4%be%9d%e7%84%b6%e6%98%af%e5%9c%86%e7%9a%84#comments</comments>
		<pubDate>Sat, 22 May 2010 20:43:18 +0000</pubDate>
		<dc:creator>52nlp</dc:creator>
				<category><![CDATA[随笔]]></category>

		<guid isPermaLink="false">http://www.52nlp.cn/?p=3376</guid>
		<description><![CDATA[　　作为国米的死忠和穆里尼奥的追随者，这一刻，很幸福！


相关文章:胡正，StarDict，TheSourceCodeOfMyWorld
Google&#8217;s Python Class &#8211; SOS
祝福大家虎年吉祥如意
单词也疯狂——漂亮的“单词云”
52nlp博客恢复
“大教堂与市集”摘要
关于计算语言学的一首词
机器翻译与微软对联
赞一下host2ez
天佑安康，天佑父老乡亲！



相关文章:<ol><li><a href='http://www.52nlp.cn/huzheng-stardict-thesourcecodeofmyworld' rel='bookmark' title='Permanent Link: 胡正，StarDict，TheSourceCodeOfMyWorld'>胡正，StarDict，TheSourceCodeOfMyWorld</a></li>
<li><a href='http://www.52nlp.cn/googles-python-class-sos' rel='bookmark' title='Permanent Link: Google&#8217;s Python Class &#8211; SOS'>Google&#8217;s Python Class &#8211; SOS</a></li>
<li><a href='http://www.52nlp.cn/%e7%a5%9d%e7%a6%8f%e5%a4%a7%e5%ae%b6%e8%99%8e%e5%b9%b4%e5%90%89%e7%a5%a5%e5%a6%82%e6%84%8f' rel='bookmark' title='Permanent Link: 祝福大家虎年吉祥如意'>祝福大家虎年吉祥如意</a></li>
<li><a href='http://www.52nlp.cn/crazy-word-beautiful-word-clouds' rel='bookmark' title='Permanent Link: 单词也疯狂——漂亮的“单词云”'>单词也疯狂——漂亮的“单词云”</a></li>
<li><a href='http://www.52nlp.cn/52nlp%e5%8d%9a%e5%ae%a2%e6%81%a2%e5%a4%8d' rel='bookmark' title='Permanent Link: 52nlp博客恢复'>52nlp博客恢复</a></li>
<li><a href='http://www.52nlp.cn/the-cathedral-and-the-bazaar-abstract' rel='bookmark' title='Permanent Link: “大教堂与市集”摘要'>“大教堂与市集”摘要</a></li>
<li><a href='http://www.52nlp.cn/a-poem-computational-linguistics' rel='bookmark' title='Permanent Link: 关于计算语言学的一首词'>关于计算语言学的一首词</a></li>
<li><a href='http://www.52nlp.cn/machine-translation-and-microsoft-couplet' rel='bookmark' title='Permanent Link: 机器翻译与微软对联'>机器翻译与微软对联</a></li>
<li><a href='http://www.52nlp.cn/praise-host2ez' rel='bookmark' title='Permanent Link: 赞一下host2ez'>赞一下host2ez</a></li>
<li><a href='http://www.52nlp.cn/%e5%a4%a9%e4%bd%91%e5%ae%89%e5%ba%b7-%e5%a4%a9%e4%bd%91%e7%88%b6%e8%80%81%e4%b9%a1%e4%ba%b2' rel='bookmark' title='Permanent Link: 天佑安康，天佑父老乡亲！'>天佑安康，天佑父老乡亲！</a></li>
</ol>]]></description>
			<content:encoded><![CDATA[<p>　　作为国米的死忠和穆里尼奥的追随者，这一刻，很幸福！</p>


<p>相关文章:<ol><li><a href='http://www.52nlp.cn/huzheng-stardict-thesourcecodeofmyworld' rel='bookmark' title='Permanent Link: 胡正，StarDict，TheSourceCodeOfMyWorld'>胡正，StarDict，TheSourceCodeOfMyWorld</a></li>
<li><a href='http://www.52nlp.cn/googles-python-class-sos' rel='bookmark' title='Permanent Link: Google&#8217;s Python Class &#8211; SOS'>Google&#8217;s Python Class &#8211; SOS</a></li>
<li><a href='http://www.52nlp.cn/%e7%a5%9d%e7%a6%8f%e5%a4%a7%e5%ae%b6%e8%99%8e%e5%b9%b4%e5%90%89%e7%a5%a5%e5%a6%82%e6%84%8f' rel='bookmark' title='Permanent Link: 祝福大家虎年吉祥如意'>祝福大家虎年吉祥如意</a></li>
<li><a href='http://www.52nlp.cn/crazy-word-beautiful-word-clouds' rel='bookmark' title='Permanent Link: 单词也疯狂——漂亮的“单词云”'>单词也疯狂——漂亮的“单词云”</a></li>
<li><a href='http://www.52nlp.cn/52nlp%e5%8d%9a%e5%ae%a2%e6%81%a2%e5%a4%8d' rel='bookmark' title='Permanent Link: 52nlp博客恢复'>52nlp博客恢复</a></li>
<li><a href='http://www.52nlp.cn/the-cathedral-and-the-bazaar-abstract' rel='bookmark' title='Permanent Link: “大教堂与市集”摘要'>“大教堂与市集”摘要</a></li>
<li><a href='http://www.52nlp.cn/a-poem-computational-linguistics' rel='bookmark' title='Permanent Link: 关于计算语言学的一首词'>关于计算语言学的一首词</a></li>
<li><a href='http://www.52nlp.cn/machine-translation-and-microsoft-couplet' rel='bookmark' title='Permanent Link: 机器翻译与微软对联'>机器翻译与微软对联</a></li>
<li><a href='http://www.52nlp.cn/praise-host2ez' rel='bookmark' title='Permanent Link: 赞一下host2ez'>赞一下host2ez</a></li>
<li><a href='http://www.52nlp.cn/%e5%a4%a9%e4%bd%91%e5%ae%89%e5%ba%b7-%e5%a4%a9%e4%bd%91%e7%88%b6%e8%80%81%e4%b9%a1%e4%ba%b2' rel='bookmark' title='Permanent Link: 天佑安康，天佑父老乡亲！'>天佑安康，天佑父老乡亲！</a></li>
</ol></p><img src="http://feeds.feedburner.com/~r/52nlp/~4/kX0ZzHoGi7A" height="1" width="1"/>]]></content:encoded>
			<wfw:commentRss>http://www.52nlp.cn/%e8%b6%b3%e7%90%83%e4%be%9d%e7%84%b6%e6%98%af%e5%9c%86%e7%9a%84/feed</wfw:commentRss>
		<slash:comments>2</slash:comments>
		<feedburner:origLink>http://www.52nlp.cn/%e8%b6%b3%e7%90%83%e4%be%9d%e7%84%b6%e6%98%af%e5%9c%86%e7%9a%84</feedburner:origLink></item>
		<item>
		<title>微软：Web N-gram Services</title>
		<link>http://feedproxy.google.com/~r/52nlp/~3/D2yUzPxrEA8/%e5%be%ae%e8%bd%af-web-n-gram-services</link>
		<comments>http://www.52nlp.cn/%e5%be%ae%e8%bd%af-web-n-gram-services#comments</comments>
		<pubDate>Wed, 12 May 2010 18:07:12 +0000</pubDate>
		<dc:creator>52nlp</dc:creator>
				<category><![CDATA[语料库]]></category>
		<category><![CDATA[语言模型]]></category>
		<category><![CDATA[Google]]></category>
		<category><![CDATA[Microsoft]]></category>
		<category><![CDATA[n-gram]]></category>
		<category><![CDATA[Web]]></category>
		<category><![CDATA[Web N-gram Services]]></category>
		<category><![CDATA[云存储]]></category>
		<category><![CDATA[微软]]></category>

		<guid isPermaLink="false">http://www.52nlp.cn/?p=3369</guid>
		<description><![CDATA[　　微软研究院的官方网站上近期发布了一篇文章：“Microsoft Web N-gram Services&#8220;，大意是邀请整个社区使用其提供的&#8221;Web N-gram services&#8221;,这个服务旨在通过基于云的存储平台，推动网络搜索，自然语言处理，语音技术等相关领域，在研究现实世界的大规模网络数据时，利用该服务所提供动态数据对项目中的常规数据进行补充更新，进而有所发现和创新。
　　有意思的是它的副标题：“Access petabytes of data via the Web N-gram services (Public Beta)”，注意微软这个服务提供的是PB(petabytes)级别的数据:
　　1PB = 1PeraByte = 1024 TB = 1024 * 1024 * 1024 MB
　　如果说Google的1T n-gram语言模型还可以压缩到大硬盘里使用的话，那么PB级别的n-gram语言模型目前来说最好的存储平台就是“云端”了。
　　微软的这项&#8221;Web N-gram Services&#8221;包括如下服务内容：
    　　* Content types: Document Body, Document Title, Anchor Texts
    　　* Model types: Smoothed models
    　　* [...]


相关文章:<ol><li><a href='http://www.52nlp.cn/beautiful-data-%e7%bb%9f%e8%ae%a1%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e7%9a%84%e5%ba%94%e7%94%a8%e4%ba%8c%e8%83%8c%e6%99%af' rel='bookmark' title='Permanent Link: Beautiful Data-统计语言模型的应用二：背景'>Beautiful Data-统计语言模型的应用二：背景</a></li>
<li><a href='http://www.52nlp.cn/beautiful-data-%e7%bb%9f%e8%ae%a1%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e7%9a%84%e5%ba%94%e7%94%a8%e4%b8%89%e5%88%86%e8%af%8d8' rel='bookmark' title='Permanent Link: Beautiful Data-统计语言模型的应用三：分词8'>Beautiful Data-统计语言模型的应用三：分词8</a></li>
<li><a href='http://www.52nlp.cn/hmm-learn-best-practices-seven-forward-backward-algorithm-2' rel='bookmark' title='Permanent Link: HMM学习最佳范例七：前向-后向算法2'>HMM学习最佳范例七：前向-后向算法2</a></li>
<li><a href='http://www.52nlp.cn/language-model-training-tools-srilm-details' rel='bookmark' title='Permanent Link: 语言模型训练工具SRILM详解'>语言模型训练工具SRILM详解</a></li>
<li><a href='http://www.52nlp.cn/hmm-learn-best-practices-seven-forward-backward-algorithm-5' rel='bookmark' title='Permanent Link: HMM学习最佳范例七：前向-后向算法5'>HMM学习最佳范例七：前向-后向算法5</a></li>
<li><a href='http://www.52nlp.cn/language-modeling-toolkit-irstlm-installation-and-trial-noting' rel='bookmark' title='Permanent Link: 语言模型工具IRSTLM安装及试用手记'>语言模型工具IRSTLM安装及试用手记</a></li>
<li><a href='http://www.52nlp.cn/mit-nlp-second-lesson-word-counting-first-part' rel='bookmark' title='Permanent Link: MIT自然语言处理第二讲：单词计数（第一部分）'>MIT自然语言处理第二讲：单词计数（第一部分）</a></li>
<li><a href='http://www.52nlp.cn/mit-nlp-third-lesson-probabilistic-language-modeling-first-part' rel='bookmark' title='Permanent Link: MIT自然语言处理第三讲：概率语言模型（第一部分）'>MIT自然语言处理第三讲：概率语言模型（第一部分）</a></li>
<li><a href='http://www.52nlp.cn/%e6%8e%a8%e8%8d%90%e5%bc%a0%e5%8d%8e%e5%b9%b3%e8%80%81%e5%b8%88%e7%9a%84%e4%b8%ad%e6%96%87%e5%88%86%e8%af%8d%e5%b7%a5%e5%85%b7-ictclas2010' rel='bookmark' title='Permanent Link: 推荐张华平老师的中文分词工具ICTCLAS2010'>推荐张华平老师的中文分词工具ICTCLAS2010</a></li>
<li><a href='http://www.52nlp.cn/beautiful-data-%e7%bb%9f%e8%ae%a1%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e7%9a%84%e5%ba%94%e7%94%a8%e4%b8%89%e5%88%86%e8%af%8d2' rel='bookmark' title='Permanent Link: Beautiful Data-统计语言模型的应用三：分词2'>Beautiful Data-统计语言模型的应用三：分词2</a></li>
</ol>]]></description>
			<content:encoded><![CDATA[<p>　　微软研究院的官方网站上近期发布了一篇文章：“<a href="http://research.microsoft.com/en-us/collaboration/focus/cs/bingiton.aspx"target=_blank>Microsoft Web N-gram Services</a>&#8220;，大意是邀请整个社区使用其提供的&#8221;Web N-gram services&#8221;,这个服务旨在通过基于云的存储平台，推动网络搜索，自然语言处理，语音技术等相关领域，在研究现实世界的大规模网络数据时，利用该服务所提供动态数据对项目中的常规数据进行补充更新，进而有所发现和创新。<span id="more-3369"></span><br />
　　有意思的是它的副标题：“Access petabytes of data via the Web N-gram services (Public Beta)”，注意微软这个服务提供的是PB(petabytes)级别的数据:<br />
　　1PB = 1PeraByte = 1024 TB = 1024 * 1024 * 1024 MB<br />
　　如果说Google的1T n-gram语言模型还可以压缩到大硬盘里使用的话，那么PB级别的n-gram语言模型目前来说最好的存储平台就是“云端”了。<br />
　　微软的这项&#8221;Web N-gram Services&#8221;包括如下服务内容：<br />
    　　* Content types: Document Body, Document Title, Anchor Texts<br />
    　　* Model types: Smoothed models<br />
    　　* N-gram availability: unigram, bigram, trigram, N-gram with N=4, 5.（最大也是5元）<br />
    　　* Training size (Body): All documents indexed by Bing<br />
    　　* Access: Hosted Services by Microsoft<br />
    　　* Updates: Periodical updates<br />
　　查了一下微软的这个“Web N-gram Services”，大致是在4月下旬WWW2010会议上公开的，之前一年属于&#8221;private beta”，目前是“public beta”，不过这篇文章最后说得是：“We are now expanding access in the Public Beta Web N-gram Services to include professors and students at accredited colleges and universities worldwide.” 似乎只针对授权的大学教授和学生开放。<br />
　　不过网上目前可以查到如何使用该服务的文章：<a href="http://data-gov.tw.rpi.edu/wiki/How_to_use_Microsoft_Web_N-gram_service"target=_blank>How to use Microsoft Web N-gram service</a>，微软自己也有一个“Quick Start&#8221;，需要你”read the terms of use”并点击“I agree&#8221;之后就能看到，或者，可以试一下下面这个网页：</p>
<p><a href="http://web-ngram.research.microsoft.com/info/quickstart.htm">http://web-ngram.research.microsoft.com/info/quickstart.htm</a></p>
<p>　　这两份文档都比较详细，有兴趣和条件的读者可以试一下。</p>
<p>注：转载请注明出处“<a href="http://www.52nlp.cn">我爱自然语言处理</a>”：<a href="http://www.52nlp.cn">www.52nlp.cn</a></p>
<p>本文链接地址：<a href="http://www.52nlp.cn/微软-web-n-gram-services">http://www.52nlp.cn/微软-web-n-gram-services</a></p>
<p>
<!-- Begin Google Adsense code -->
<script type="text/javascript"><!--
google_ad_client = "pub-4332174469367599";
/* 336x280, 创建于 09-2-7 */
google_ad_slot = "5707022987";
google_ad_width = 336;
google_ad_height = 280;
//-->
</script>
<script type="text/javascript"
src="http://pagead2.googlesyndication.com/pagead/show_ads.js">
</script>
<!-- End Google Adsense code -->
</p>


<p>相关文章:<ol><li><a href='http://www.52nlp.cn/beautiful-data-%e7%bb%9f%e8%ae%a1%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e7%9a%84%e5%ba%94%e7%94%a8%e4%ba%8c%e8%83%8c%e6%99%af' rel='bookmark' title='Permanent Link: Beautiful Data-统计语言模型的应用二：背景'>Beautiful Data-统计语言模型的应用二：背景</a></li>
<li><a href='http://www.52nlp.cn/beautiful-data-%e7%bb%9f%e8%ae%a1%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e7%9a%84%e5%ba%94%e7%94%a8%e4%b8%89%e5%88%86%e8%af%8d8' rel='bookmark' title='Permanent Link: Beautiful Data-统计语言模型的应用三：分词8'>Beautiful Data-统计语言模型的应用三：分词8</a></li>
<li><a href='http://www.52nlp.cn/hmm-learn-best-practices-seven-forward-backward-algorithm-2' rel='bookmark' title='Permanent Link: HMM学习最佳范例七：前向-后向算法2'>HMM学习最佳范例七：前向-后向算法2</a></li>
<li><a href='http://www.52nlp.cn/language-model-training-tools-srilm-details' rel='bookmark' title='Permanent Link: 语言模型训练工具SRILM详解'>语言模型训练工具SRILM详解</a></li>
<li><a href='http://www.52nlp.cn/hmm-learn-best-practices-seven-forward-backward-algorithm-5' rel='bookmark' title='Permanent Link: HMM学习最佳范例七：前向-后向算法5'>HMM学习最佳范例七：前向-后向算法5</a></li>
<li><a href='http://www.52nlp.cn/language-modeling-toolkit-irstlm-installation-and-trial-noting' rel='bookmark' title='Permanent Link: 语言模型工具IRSTLM安装及试用手记'>语言模型工具IRSTLM安装及试用手记</a></li>
<li><a href='http://www.52nlp.cn/mit-nlp-second-lesson-word-counting-first-part' rel='bookmark' title='Permanent Link: MIT自然语言处理第二讲：单词计数（第一部分）'>MIT自然语言处理第二讲：单词计数（第一部分）</a></li>
<li><a href='http://www.52nlp.cn/mit-nlp-third-lesson-probabilistic-language-modeling-first-part' rel='bookmark' title='Permanent Link: MIT自然语言处理第三讲：概率语言模型（第一部分）'>MIT自然语言处理第三讲：概率语言模型（第一部分）</a></li>
<li><a href='http://www.52nlp.cn/%e6%8e%a8%e8%8d%90%e5%bc%a0%e5%8d%8e%e5%b9%b3%e8%80%81%e5%b8%88%e7%9a%84%e4%b8%ad%e6%96%87%e5%88%86%e8%af%8d%e5%b7%a5%e5%85%b7-ictclas2010' rel='bookmark' title='Permanent Link: 推荐张华平老师的中文分词工具ICTCLAS2010'>推荐张华平老师的中文分词工具ICTCLAS2010</a></li>
<li><a href='http://www.52nlp.cn/beautiful-data-%e7%bb%9f%e8%ae%a1%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e7%9a%84%e5%ba%94%e7%94%a8%e4%b8%89%e5%88%86%e8%af%8d2' rel='bookmark' title='Permanent Link: Beautiful Data-统计语言模型的应用三：分词2'>Beautiful Data-统计语言模型的应用三：分词2</a></li>
</ol></p><img src="http://feeds.feedburner.com/~r/52nlp/~4/D2yUzPxrEA8" height="1" width="1"/>]]></content:encoded>
			<wfw:commentRss>http://www.52nlp.cn/%e5%be%ae%e8%bd%af-web-n-gram-services/feed</wfw:commentRss>
		<slash:comments>7</slash:comments>
		<feedburner:origLink>http://www.52nlp.cn/%e5%be%ae%e8%bd%af-web-n-gram-services</feedburner:origLink></item>
	</channel>
</rss>
