🌐 Baseline System 1 - NTCIR Project.html (Html) 15.1 KB 2016-01-06
HTML template for Baseline System 1 NTCIR Project
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52 | <!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<!-- saved from url=(0048)http://ntcir.nii.ac.jp/PatentMT/baselineSystem1/ -->
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en"><script type="text/javascript">window["_gaUserPrefs"] = { ioo : function() { return true; } }</script><head><meta http-equiv="Content-Type" content="text/html; charset=UTF-8"><meta http-equiv="content-language" content="en"><meta name="robots" content="index,follow"><meta name="keywords" content="CMS,Netcommons,Maple"><meta name="description" content="CMS,Netcommons,Maple"><meta name="rating" content="General"><meta name="author" content="NetCommons"><meta name="copyright" content="Copyright © 2007-2008"><meta http-equiv="content-script-type" content="text/javascript"><meta http-equiv="content-style-type" content="text/css"><link rel="canonical" href="http://ntcir.nii.ac.jp/PatentMT/baselineSystem1/"><title>Baseline System 1 - NTCIR Project</title><script type="text/javascript">_nc_lang_name = "english";_nc_layoutmode = "off";_nc_base_url = "http://ntcir.nii.ac.jp";_nc_core_base_url = "http://ntcir.nii.ac.jp";_nc_index_file_name = "/index.php";_nc_current_url = 'http://ntcir.nii.ac.jp/index.php?_restful_permalink=PatentMT%2FbaselineSystem1';_nc_allow_attachment = '0';_nc_allow_htmltag = '0';_nc_allow_video = '0';_nc_main_page_id = '256';_nc_user_id = '0';_nc_debug = 0;_nc_ajaxFlag = false;_nc_dwScriptCount = 0;_nc_dwScriptList = Array();_nc_js_vs = '20130326222549';_nc_css_vs = '20131025063628';</script><link href="http://ntcir.nii.ac.jp/images/common/favicon.ico" rel="SHORTCUT ICON"><link class="_common_css" rel="stylesheet" type="text/css" media="all" href="./Baseline System 1 - NTCIR Project_files/index.php"><style type="text/css"></style><style type="text/css"></style><style type="text/css">:root .container > .infoBoxList > .shareInfoBox
{display:none !important;}</style><link rel="stylesheet" type="text/css" href="chrome-extension://pkehgijcmpdhfbdbbnkijodmdjhbjlgp/skin/socialwidgets.css"></head><body style=""><noscript><div class="errorHeaderMsg">You need to have JavaScript enabled to use this page.</div></noscript><script type="text/javascript">if (document.cookie == "") {document.write(unescape('%3Cdiv class="errorHeaderMsg"%3EYou need to have Cookie enabled to use this page.%3C/div%3E'));}</script>
<link rel="stylesheet" type="text/css" href="./Baseline System 1 - NTCIR Project_files/user.css"><div class="ntcir_bg"><table class="ntcir_container" align="center"><tbody><tr><td><table id="_container" class="container" summary="" style="text-align:left;"><tbody><tr><td class="valign-top align-left">
<div id="_headercolumn" class="headercolumn">
<div id="__headercolumn" class="main_column">
<table class="widthmax" summary=""><tbody><tr><td class="column valign-top"><div class="cell" style="padding:0px 0px 0px 0px;"><table id="_449" class="blockstyle_449 module_box noneframe" style="width:100%"><tbody><tr><td><input type="hidden" id="_token_449" class="_token" value="089d507e8493ec0966c6c10cf2053bb1"><input type="hidden" id="_url_449" class="_url" value="http://ntcir.nii.ac.jp/index.php?theme_name=noneframe&page_id=3&block_id=449&module_id=14&action=announcement_view_main_init&temp_name=default"><a id="_href_449" name="_449"></a><table border="0" cellspacing="0" cellpadding="0" class="th_none widthmax"><tbody><tr><td class="th_none_content"><h2 class="th_none_title nc_block_title display-none" title=""></h2><div class="content"><div class="widthmax">
<div class="header"><script src="./Baseline System 1 - NTCIR Project_files/jquery.min.js"></script><script type="text/javascript" src="./Baseline System 1 - NTCIR Project_files/jquery.rollover.js"></script><h1 class="logo"><a href="http://ntcir.nii.ac.jp/"><img alt="NTCIR" src="./Baseline System 1 - NTCIR Project_files/logo.gif"></a></h1><div class="copy">NII Testbeds and Community for Information access Research</div><ul class="menu"><li class="home"><a href="http://ntcir.nii.ac.jp/"><img alt="Home" src="./Baseline System 1 - NTCIR Project_files/btn_home_off.gif"></a></li><li><a href="http://ntcir.nii.ac.jp/about/"><img alt="About NTCIR" src="./Baseline System 1 - NTCIR Project_files/btn_about_off.gif"></a></li><li><a href="http://ntcir.nii.ac.jp/faq/"><img alt="FAQ" src="./Baseline System 1 - NTCIR Project_files/btn_faq_off.gif"></a></li><li><a href="http://ntcir.nii.ac.jp/index.php?action=pages_view_main&active_center=search_view_main_center"><img alt="Search" src="./Baseline System 1 - NTCIR Project_files/btn_search_off.gif"></a></li></ul><ul class="gnavi"><li><a href="http://research.nii.ac.jp/ntcir/index-en.html" target="_blank"><img alt="NTCIR Official site" src="./Baseline System 1 - NTCIR Project_files/gnavi_officialsite_off.png"></a></li><li><a href="http://research.nii.ac.jp/ntcir/ntcir-12/index.html" target="_blank"><img alt="Conference" src="./Baseline System 1 - NTCIR Project_files/gnavi_conference_off.png"></a></li><li><a href="http://research.nii.ac.jp/ntcir/ntcir-12/chairs.html" target="_blank"><img alt="Organizers" src="./Baseline System 1 - NTCIR Project_files/gnavi_organizers_off.png"></a></li><li><a href="http://research.nii.ac.jp/ntcir/data/data-en.html" target="_blank"><img alt="Data" src="./Baseline System 1 - NTCIR Project_files/gnavi_data_off.png"></a></li><li><a href="http://research.nii.ac.jp/ntcir/ntcir-12/dates.html" target="_blank"><img alt="Important Dates" src="./Baseline System 1 - NTCIR 
Project_files/gnavi_importantdates_off.png"></a></li></ul></div>
<div class="float-clear-div"> </div>
</div>
</div></td></tr></tbody></table></td></tr></tbody></table></div></td></tr></tbody></table>
</div>
</div>
</td></tr><tr><td><table class="widthmax" summary=""><tbody><tr><td id="_leftcolumn" class="leftcolumn valign-top align-left" style=""><div id="__leftcolumn" class="main_column"><table class="widthmax" summary=""><tbody><tr><td class="column valign-top"><div class="cell" style="padding:0px 30px 0px 0px;"><table id="_4" class="blockstyle_4 module_box classic_default" style="width:100%"><tbody><tr><td><input type="hidden" id="_token_4" class="_token" value="089d507e8493ec0966c6c10cf2053bb1"><input type="hidden" id="_url_4" class="_url" value="http://ntcir.nii.ac.jp/index.php?theme_name=classic_default&page_id=4&block_id=4&module_id=26&action=menu_view_main_init&temp_name=common_menu"><a id="_href_4" name="_4"></a><table id="_theme_top_4" class="th_classic_default widthmax" summary=""><tbody><tr class="_block_title_event display-none"><td class="th_classic_default_header"><table class="_move_bar widthmax" title="" summary=""><tbody><tr><td><h2 class="nc_block_title th_classic_default_title" title=""></h2></td><td class="align-right"></td></tr></tbody></table></td></tr><tr><td><div class="th_classic_content content"><div class="outerdiv"><ul id="common_menu"><!--<li ><a href="http://ntcir.nii.ac.jp/index.php?action=pages_view_main&page_id=207"><div>HOME</div></a></li>//--><li><a href="http://ntcir.nii.ac.jp/QA-Lab/"><div>QA Lab</div></a></li><li><a href="http://ntcir.nii.ac.jp/Temporalia/"><div>Temporalia</div></a></li><li><a href="http://ntcir.nii.ac.jp/CrossLink-1/"><div>CrossLink</div></a></li><li><a href="http://ntcir.nii.ac.jp/PatentMTList/"><div>PatentMT</div></a></li><li><a href="http://ntcir.nii.ac.jp/about/"><div>About NTCIR</div></a></li><ul></ul><li><a href="http://ntcir.nii.ac.jp/Papers-on-NTCIR-using-NTCIR/"><div>Papers on NTCIR/using NTCIR</div></a></li><li><a href="http://ntcir.nii.ac.jp/NTCIR-Blog/"><div>NTCIR Blog</div></a></li><li><a href="http://ntcir.nii.ac.jp/Album/"><div>Album</div></a></li><li><a 
href="http://ntcir.nii.ac.jp/Your-Voice/"><div>Your Voice</div></a></li><li><a href="http://ntcir.nii.ac.jp/past_ws/"><div>Past Workshop</div></a></li><li><a href="http://ntcir.nii.ac.jp/calendar/"><div>Calendar</div></a></li></ul></div></div></td></tr></tbody></table></td></tr></tbody></table></div></td></tr></tbody></table></div></td><td id="_centercolumn" class="centercolumn valign-top align-left" style=""><a class="hidelink" name="center_column"></a><div id="__centercolumn" class="main_column"><table class="widthmax" summary=""><tbody><tr><td class="column valign-top"><div class="cell" style="padding:8px 8px 8px 8px;"><table id="_330" class="blockstyle_330 module_box noneframe" style="width:100%"><tbody><tr><td><input type="hidden" id="_token_330" class="_token" value="089d507e8493ec0966c6c10cf2053bb1"><input type="hidden" id="_url_330" class="_url" value="http://ntcir.nii.ac.jp/index.php?theme_name=noneframe&page_id=256&block_id=330&module_id=14&action=announcement_view_main_init&temp_name=default"><a id="_href_330" name="_330"></a><table border="0" cellspacing="0" cellpadding="0" class="th_none widthmax"><tbody><tr><td class="th_none_content"><h2 class="th_none_title nc_block_title display-none" title=""></h2><div class="content"><div class="widthmax">
<span style="color: rgb(0, 0, 0); "><font size="3"><center><h2>Baseline System 1: Hierarchical phrase-based SMT</h2></center><br>
Here, "fr" represents the source language and "en" represents the target language.
<blockquote><code>export SCRIPTS_ROOTDIR=${pathName}/moses-scripts/scripts-XXXXXXXX-XXXX<br>
MOSES_CHART_CMD=${pathName}/moses/trunk/moses-chart-cmd/src/moses_chart<br>
MOSES_CMD=${pathName}/moses/trunk/moses-cmd/src/moses<br>
MERT_DIR=${pathName}/moses/trunk/mert<br>
GIZA_BIN_DIR=${pathName}/giza-pp/bin<br>
SRILM_DIR=${pathName}/srilm/bin/i686-m64<br>
SCRIPTS_DIR=${pathName}/scripts<br>
</code></blockquote><h2>Build Language Model</h2><blockquote><code>mkdir lm<br>
${SRILM_DIR}/ngram-count -order 5 -interpolate -kndiscount -unk -text corpus.tok/train-all.tok.lower.en -lm lm/train-all.en.lm<br>
</code></blockquote><h2>Train Model</h2><blockquote><code>mkdir hierarModel<br>
cd hierarModel/<br>
<br>
mkdir work<br>
<br>
${SCRIPTS_ROOTDIR}/training/train-model.perl \<br>
--scripts-root-dir ${SCRIPTS_ROOTDIR} \<br>
--root-dir `pwd`/work \<br>
--bin-dir ${GIZA_BIN_DIR} \<br>
--corpus ../corpus.tok/train-all.clean1-40 \<br>
--f fr \<br>
--e en \<br>
--parallel \<br>
--alignment grow-diag-final \<br>
--hierarchical \<br>
--glue-grammar \<br>
--extract-options="--MinHoleSource 1" \<br>
--lm 0:5:`pwd`/../lm/train-all.en.lm \<br>
>& work/training.out<br>
... [truncated, 105 more lines] ...
|
{
"@context": "https://schema.org",
"@type": "SoftwareSourceCode",
"name": "Baseline System 1 - NTCIR Project.html",
"description": "HTML template for Baseline System 1 NTCIR Project",
"dateModified": "2016-01-06",
"dateCreated": "2025-03-23",
"contentSize": "15.1 KB",
"contentUrl": "https://www.artikelschreiber.com/opensource/onetipp/Technisches/Realisierung/Moses/Baseline System 1 - NTCIR Project.html",
"encodingFormat": "text/html",
"programmingLanguage": {
"@type": "ComputerLanguage",
"name": "Html"
},
"codeRepository": "https://www.artikelschreiber.com/opensource/onetipp/Technisches/Realisierung/Moses/"
}
🌐 Tree-to-String SMT (Baseline System at WAT2015).html (Html) 6.6 KB 2015-12-22
HTML template for Tree to String SMT (Baseline System at WAT2015)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52 | <html>
<head>
<TITLE>Tree-to-String SMT (Baseline System at WAT2015)</TITLE>
<LINK REL="stylesheet" type="text/css" href="baseline.css">
<meta http-equiv="content-type" content="text/html;charset=utf-8">
</head>
<body>
<script>
(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
ga('create', 'UA-48872754-1', 'kyoto-u.ac.jp');
ga('send', 'pageview');
</script>
<center>
<div align="left" style="position: relative; height: 30;">
<img src="../pic/jst_logo.jpg" alt="JST_LOGO.JPG" height="40">
<img src="../pic/nict_logo.jpg" alt="NICT_LOGO.JPG" height="40">
<img src="../pic/kyoto-u_logo.jpg" alt="KYOTO-U_LOGO.JPG" height="40">
</div>
<h1 id="home.html">
<div style="font-size: 140%; height: 15">WAT 2015</div><br>
<div style="font-size: 70%">The 2nd Workshop on Asian Translation</div>
<div style="font-size: 100%">Baseline Systems</div>
<div style="font-size: 100%">Tree-to-String SMT</div>
<div style="font-size: 100%">for the EJ and CJ subtasks</div>
</h1>
[<A HREF="baselineSystems.html">BASELINE SYSTEMS TOP</A>]
| [<A HREF="#setup.html">SETUP</A>]
| [<A HREF="#lm.html">TRAINING LANGUAGE MODEL</A>]
| [<A HREF="#tm.html">TRAINING TRANSLATION MODEL</A>]
| [<A HREF="#tuning.html">TUNING</A>]
| [<A HREF="#translating.html">TRANSLATING</A>]
| [<A HREF="#detokenize.html">DETOKENIZE THE OUTPUT</A>]
</center>
<span style="color: rgb(0, 0, 0);"><font size="3">
<h2 id="setup.html">Setup</h2>
(Here, ${LANG_F} represents the source language and ${LANG_E} represents the target language.
"en" and "ja" are samples.)
... [truncated, 166 more lines] ...
|
{
"@context": "https://schema.org",
"@type": "SoftwareSourceCode",
"name": "Tree-to-String SMT (Baseline System at WAT2015).html",
"description": "HTML template for Tree to String SMT (Baseline System at WAT2015)",
"dateModified": "2015-12-22",
"dateCreated": "2025-03-23",
"contentSize": "6.6 KB",
"contentUrl": "https://www.artikelschreiber.com/opensource/onetipp/Technisches/Realisierung/Moses/Tree-to-String SMT (Baseline System at WAT2015).html",
"encodingFormat": "text/html",
"programmingLanguage": {
"@type": "ComputerLanguage",
"name": "Html"
},
"codeRepository": "https://www.artikelschreiber.com/opensource/onetipp/Technisches/Realisierung/Moses/"
}
📄 trainingsablauf.txt (Text) 2.0 KB 2015-12-27
Source code file for trainingsablauf
{
"@context": "https://schema.org",
"@type": "SoftwareSourceCode",
"name": "trainingsablauf.txt",
"description": "Source code file for trainingsablauf",
"dateModified": "2015-12-27",
"dateCreated": "2025-03-23",
"contentSize": "2.0 KB",
"contentUrl": "https://www.artikelschreiber.com/opensource/onetipp/Technisches/Realisierung/Moses/trainingsablauf.txt",
"encodingFormat": "text/plain",
"programmingLanguage": {
"@type": "ComputerLanguage",
"name": "Text"
},
"codeRepository": "https://www.artikelschreiber.com/opensource/onetipp/Technisches/Realisierung/Moses/"
}
📄 trainingsablauf_deutsch_zu_english.txt (Text) 2.9 KB 2016-01-06
Source code file for trainingsablauf deutsch zu english
{
"@context": "https://schema.org",
"@type": "SoftwareSourceCode",
"name": "trainingsablauf_deutsch_zu_english.txt",
"description": "Source code file for trainingsablauf deutsch zu english",
"dateModified": "2016-01-06",
"dateCreated": "2025-03-23",
"contentSize": "2.9 KB",
"contentUrl": "https://www.artikelschreiber.com/opensource/onetipp/Technisches/Realisierung/Moses/trainingsablauf_deutsch_zu_english.txt",
"encodingFormat": "text/plain",
"programmingLanguage": {
"@type": "ComputerLanguage",
"name": "Text"
},
"codeRepository": "https://www.artikelschreiber.com/opensource/onetipp/Technisches/Realisierung/Moses/"
}
📄 trainingsablauf_english_zu_deutsch.txt (Text) 2.1 KB 2015-12-31
Source code file for trainingsablauf english zu deutsch
{
"@context": "https://schema.org",
"@type": "SoftwareSourceCode",
"name": "trainingsablauf_english_zu_deutsch.txt",
"description": "Source code file for trainingsablauf english zu deutsch",
"dateModified": "2015-12-31",
"dateCreated": "2025-03-23",
"contentSize": "2.1 KB",
"contentUrl": "https://www.artikelschreiber.com/opensource/onetipp/Technisches/Realisierung/Moses/trainingsablauf_english_zu_deutsch.txt",
"encodingFormat": "text/plain",
"programmingLanguage": {
"@type": "ComputerLanguage",
"name": "Text"
},
"codeRepository": "https://www.artikelschreiber.com/opensource/onetipp/Technisches/Realisierung/Moses/"
}